{
 "cells": [
  {
   "cell_type": "code",
   "execution_count": 1,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-1-8ae4025e7ff4>:19: DeprecationWarning: use options instead of chrome_options\n",
      "  driver = webdriver.Chrome( chrome_options = opts) #desired_capabilities=caps,\n"
     ]
    }
   ],
   "source": [
    "from selenium import webdriver\n",
    "from selenium.webdriver.common.by import By\n",
    "from selenium.webdriver.common.desired_capabilities import DesiredCapabilities\n",
    "\n",
    "\n",
    "#caps=dict()\n",
    "#caps[\"pageLoadStrategy\"] = \"none\"   # Do not wait for full page load\n",
    "\n",
    "opts = webdriver.ChromeOptions()\n",
    "opts.add_argument('--no-sandbox')  # works around the \"DevToolsActivePort file doesn't exist\" startup error\n",
    "opts.add_argument('--window-size=1920,3000')  # browser window size; Chrome expects WIDTH,HEIGHT separated by a comma\n",
    "opts.add_argument('--disable-gpu')  # the Chrome docs mention this flag as a workaround for a bug\n",
    "opts.add_argument('--hide-scrollbars')  # hide scrollbars, for some special pages\n",
    "# opts.add_argument('--blink-settings=imagesEnabled=false')  # do not load images, to speed things up\n",
    "# opts.add_argument('--headless')  # no visible browser window; on Linux without a display, startup fails unless this is set\n",
    "# opts.binary_location = r\"C:\\path\\to\\chrome.exe\"  # only needed to drive a non-default browser binary\n",
    "\n",
    "# Pass the options via `options=`; the `chrome_options=` keyword is deprecated.\n",
    "driver = webdriver.Chrome(options=opts)  # desired_capabilities=caps can also be passed here"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 打开知网（校园网自动登录）"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 2,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Landing page of CNKI; kept in a named constant so the target site is easy to spot.\n",
    "CNKI_HOME_URL = 'https://cnki.net'\n",
    "driver.get(CNKI_HOME_URL)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 检查"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 3,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'中山大学南...'"
      ]
     },
     "execution_count": 3,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Read the login display element to confirm the automatic campus-network sign-in worked.\n",
    "driver.find_element(By.ID, 'Ecp_loginShowName1').get_attribute('innerHTML')"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 打开高级检索"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 4,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Click the advanced-search entry on the home page.\n",
    "element = driver.find_element(By.ID, 'highSearch')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 检查窗口\n",
    "* 当出现多个窗口，请检查窗口信息\n",
    "* 窗口信息根据窗口加载的顺序按照列表存储，每一个窗口有唯一识别的窗口ID"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 5,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'CDwindow-C75A27B0B67D805DDC892DB2ECD948F6'"
      ]
     },
     "execution_count": 5,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Handle (ID) of the window the driver is currently focused on\n",
    "driver.current_window_handle"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 6,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['CDwindow-C75A27B0B67D805DDC892DB2ECD948F6',\n",
       " 'CDwindow-C1CAFA10717FF53C58BFD87722DEC54D']"
      ]
     },
     "execution_count": 6,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Handles (IDs) of all windows open in this browser session\n",
    "driver.window_handles"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 7,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-7-704fdf3805c1>:2: DeprecationWarning: use driver.switch_to.window instead\n",
      "  driver.switch_to_window(driver.window_handles[1])\n"
     ]
    }
   ],
   "source": [
    "# Switch focus to the second window in the handle list.\n",
    "# `switch_to.window` replaces the deprecated `switch_to_window` method.\n",
    "driver.switch_to.window(driver.window_handles[1])"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 点击学术期刊"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 8,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Select the \"学术期刊\" (academic journals) entry in the document-type menu.\n",
    "element = driver.find_element(By.XPATH, '//ul[@class=\"doctype-menus keji\"]/li[@data-id=\"xsqk\"]/a')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 点击专业检索"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 9,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Open the \"专业检索\" (professional search) tab.\n",
    "# NOTE(review): this absolute XPath depends on the exact page layout and will break\n",
    "# if the site changes its markup; prefer an id/class-based locator once one is confirmed.\n",
    "element = driver.find_element(By.XPATH, '/html/body/div[2]/div/div[2]/ul/li[4]')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 勾选来源类别"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 10,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Tick the source-category checkbox with key \"EI\"; skip the click if it is already\n",
    "# ticked so that re-running this cell does not untick it.\n",
    "element = driver.find_element(By.XPATH, '//input[@key=\"EI\"]')\n",
    "if not element.is_selected():\n",
    "    element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 11,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Tick the source-category checkbox with key \"HX\" (北大核心, Peking University core journals);\n",
    "# skip the click if it is already ticked so that re-running this cell does not untick it.\n",
    "element = driver.find_element(By.XPATH, '//input[@key=\"HX\"]')\n",
    "if not element.is_selected():\n",
    "    element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 12,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Tick the source-category checkbox with key \"CSI\"; skip the click if it is already\n",
    "# ticked so that re-running this cell does not untick it.\n",
    "element = driver.find_element(By.XPATH, '//input[@key=\"CSI\"]')\n",
    "if not element.is_selected():\n",
    "    element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 13,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Tick the source-category checkbox with key \"SI\"; skip the click if it is already\n",
    "# ticked so that re-running this cell does not untick it.\n",
    "element = driver.find_element(By.XPATH, '//input[@key=\"SI\"]')\n",
    "if not element.is_selected():\n",
    "    element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 14,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Tick the source-category checkbox with key \"CSD\"; skip the click if it is already\n",
    "# ticked so that re-running this cell does not untick it.\n",
    "element = driver.find_element(By.XPATH, '//input[@key=\"CSD\"]')\n",
    "if not element.is_selected():\n",
    "    element.click()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 设置搜索query"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 15,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Search expression typed into the professional-search box.\n",
    "# NOTE(review): SU / TI look like CNKI field codes (presumably subject / title) - confirm against CNKI's search help.\n",
    "# A more complex example:\n",
    "# query = 'SU = \"新媒体\" AND (TI = \"人工智能\" OR TI = \"大数据\" OR TI = \"big data\")'\n",
    "query = 'SU=\"人工智能\"'"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 16,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Replace whatever is in the page's first <textarea> with the search expression.\n",
    "element = driver.find_element(By.XPATH, '//textarea')\n",
    "element.clear()\n",
    "element.send_keys(query)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 17,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Click the \"检索\" (search) button to run the query.\n",
    "element = driver.find_element(By.XPATH, '//input[@value=\"检索\"]')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 检查检索信息 更换页面文章数量"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 18,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'共找到<em>26,123</em>条结果'"
      ]
     },
     "execution_count": 18,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Check the result count shown in the pager title\n",
    "element = driver.find_element(By.XPATH, '//span[@class=\"pagerTitleCell\"]')\n",
    "element.get_attribute('innerHTML')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 19,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Click the sort icon.\n",
    "# NOTE(review): presumably this expands the results-per-page dropdown used in the next cell - confirm.\n",
    "element = driver.find_element(By.XPATH, '//i[@class=\"icon icon-sort\"]')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 20,
   "metadata": {},
   "outputs": [],
   "source": [
    "# Choose the entry with data-val=\"50\" in the per-page list (50 articles per page).\n",
    "element = driver.find_element(By.XPATH, '//div[@id=\"perPageDiv\"]//li[@data-val=\"50\"]/a')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 抓取页面数据"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 21,
   "metadata": {},
   "outputs": [],
   "source": [
    "import pandas as pd"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 22,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>机器学习在档案管理中的应用与挑战——基于新南威尔士州档案馆机器学习实验的调查与启示  网络首发</td>\n",
       "      <td>代林序; 张玉洁</td>\n",
       "      <td>档案与建设</td>\n",
       "      <td>2021-07-02 16:16</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>关于智能化战争的基本认知  网络首发</td>\n",
       "      <td>郭明</td>\n",
       "      <td>人民论坛·学术前沿</td>\n",
       "      <td>2021-07-02 15:49</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3</td>\n",
       "      <td>金融科技中人工智能技术典型事实与核心规律  网络首发</td>\n",
       "      <td>陈增敬; 严晓东; 冯新伟</td>\n",
       "      <td>中国科学基金</td>\n",
       "      <td>2021-07-02 11:39</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4</td>\n",
       "      <td>卫星在轨故障案例与人工智能故障诊断  网络首发</td>\n",
       "      <td>王亚坤;杨凯飞;张婕;郭莉芳;韩笑冬</td>\n",
       "      <td>中国空间科学技术</td>\n",
       "      <td>2021-07-02 08:49</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>5</td>\n",
       "      <td>高等职业教育智能生态系统:内涵、结构与实践路径</td>\n",
       "      <td>徐晔</td>\n",
       "      <td>中国远程教育</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>6</td>\n",
       "      <td>近20年在线学习环境研究评述——基于LDA和DTM的动态分析</td>\n",
       "      <td>牛晓杰; 郑勤华</td>\n",
       "      <td>中国远程教育</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>7</td>\n",
       "      <td>教育人工智能场域下教师角色与行动取向</td>\n",
       "      <td>赵磊磊; 马玉菲; 代蕊华</td>\n",
       "      <td>中国远程教育</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>8</td>\n",
       "      <td>智能财务人才培养与浙江大学的探索  网络首发</td>\n",
       "      <td>陈俊; 董望</td>\n",
       "      <td>财会月刊</td>\n",
       "      <td>2021-07-01 15:42</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>9</td>\n",
       "      <td>机器学习在智能配用电领域的应用：北美工程实践概述  网络首发</td>\n",
       "      <td>李亦言; 胡荣兴; 宋立冬; 贾乾罡; 陆宁</td>\n",
       "      <td>电力系统自动化</td>\n",
       "      <td>2021-07-01 09:50</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>10</td>\n",
       "      <td>国际经贸协定中的源代码规则新发展及中国立场  网络首发</td>\n",
       "      <td>鄢雨虹</td>\n",
       "      <td>武大国际法评论</td>\n",
       "      <td>2021-07-01 09:16</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>11</td>\n",
       "      <td>人工智能赋能高校数据治理：逻辑、挑战与实践  网络首发</td>\n",
       "      <td>赵磊磊</td>\n",
       "      <td>重庆高教研究</td>\n",
       "      <td>2021-06-30 14:14</td>\n",
       "      <td>NaN</td>\n",
       "      <td>114.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>12</td>\n",
       "      <td>嵌入式神经网络加速器及SoC芯片  网络首发</td>\n",
       "      <td>易冬柏; 陈恒; 何乐年</td>\n",
       "      <td>仪器仪表学报</td>\n",
       "      <td>2021-06-30 10:09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>59.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>13</td>\n",
       "      <td>绿色理念下智慧零售创新发展路径</td>\n",
       "      <td>翟璇</td>\n",
       "      <td>商业经济研究</td>\n",
       "      <td>2021-06-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>6.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>14</td>\n",
       "      <td>数字经济视野下跨境电商企业的升级策略研究——评《跨境电商与国际物流》</td>\n",
       "      <td>单浩耘</td>\n",
       "      <td>商业经济研究</td>\n",
       "      <td>2021-06-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>15.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>15</td>\n",
       "      <td>智能化金融监管：模型框架、边缘约束和实践策略  网络首发</td>\n",
       "      <td>乔宇锋</td>\n",
       "      <td>南方金融</td>\n",
       "      <td>2021-06-29 17:04</td>\n",
       "      <td>NaN</td>\n",
       "      <td>105.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>16</td>\n",
       "      <td>“智能+”时代的现代文化产业体系：挑战与重塑</td>\n",
       "      <td>解学芳; 雷文宣</td>\n",
       "      <td>深圳大学学报(人文社会科学版)</td>\n",
       "      <td>2021-06-29 15:45</td>\n",
       "      <td>NaN</td>\n",
       "      <td>65.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>17</td>\n",
       "      <td>人工智能在胸部创伤肋骨骨折CT诊断中应用的初步研究  网络首发</td>\n",
       "      <td>刘想;谢辉辉;许玉峰;陶晓峰;柳林</td>\n",
       "      <td>上海交通大学学报(医学版)</td>\n",
       "      <td>2021-06-29 14:47</td>\n",
       "      <td>NaN</td>\n",
       "      <td>38.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>18</td>\n",
       "      <td>人工智能技术在火电行业的应用探讨  网络首发</td>\n",
       "      <td>华志刚; 范佳卿; 郭荣; 汪勇; 吴潇翔</td>\n",
       "      <td>中国电力</td>\n",
       "      <td>2021-06-29 11:10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>127.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>19</td>\n",
       "      <td>基于切换输出机制的超短期风电功率预测  网络首发</td>\n",
       "      <td>杨茂; 许传宇; 王凯旋</td>\n",
       "      <td>高电压技术</td>\n",
       "      <td>2021-06-29 11:02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>23.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>20</td>\n",
       "      <td>DCN:双通道密集哈达玛卷积的画质评价网络  网络首发</td>\n",
       "      <td>杨晓东; 韩振奇; 刘立庄; 赵丹</td>\n",
       "      <td>计算机工程与应用</td>\n",
       "      <td>2021-06-29 09:20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>26.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>21</td>\n",
       "      <td>智能交通管理系统发展趋势  网络首发</td>\n",
       "      <td>李瑞敏; 王长君</td>\n",
       "      <td>清华大学学报(自然科学版)</td>\n",
       "      <td>2021-06-29 08:59</td>\n",
       "      <td>NaN</td>\n",
       "      <td>94.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>22</td>\n",
       "      <td>人工智能写作背景下作者主体性的消解与重构——以陈楸帆人机交互写作实验为中心</td>\n",
       "      <td>周建琼</td>\n",
       "      <td>当代文坛</td>\n",
       "      <td>2021-06-29</td>\n",
       "      <td>NaN</td>\n",
       "      <td>28.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>23</td>\n",
       "      <td>空气源热泵除霜控制方法研究现状及展望  网络首发</td>\n",
       "      <td>王沣浩; 马龙霞; 王志华; 楼业春; 刘孜璇</td>\n",
       "      <td>制冷学报</td>\n",
       "      <td>2021-06-28 10:21</td>\n",
       "      <td>NaN</td>\n",
       "      <td>60.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>24</td>\n",
       "      <td>面向机器人自主分割的肉品识别分类系统实现  网络首发</td>\n",
       "      <td>马欢; 冀晶晶; 刘佳豪; 刘雨婷</td>\n",
       "      <td>图学学报</td>\n",
       "      <td>2021-06-28 08:48</td>\n",
       "      <td>NaN</td>\n",
       "      <td>150.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>25</td>\n",
       "      <td>AI辅助头颈CTA在诊断颅内动脉瘤中的应用</td>\n",
       "      <td>邓昊;韦鑫;曹闻挺;艾光勇;余菡</td>\n",
       "      <td>第三军医大学学报</td>\n",
       "      <td>2021-06-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>6.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>26</td>\n",
       "      <td>人工智能模型预测输尿管结石自然排出的多中心临床试验的验证研究</td>\n",
       "      <td>曾凯; 王新敏; 倪钊; 王勤章; 李强</td>\n",
       "      <td>中国全科医学</td>\n",
       "      <td>2021-06-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>18.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>27</td>\n",
       "      <td>城市暴雨内涝综述：特征、机理、数据与方法</td>\n",
       "      <td>黄华兵; 王先伟; 柳林</td>\n",
       "      <td>地理科学进展</td>\n",
       "      <td>2021-06-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>28</td>\n",
       "      <td>基于计算机视觉的织物光泽测试方法研究  网络首发</td>\n",
       "      <td>张建新; 黄钢; 李消晋</td>\n",
       "      <td>丝绸</td>\n",
       "      <td>2021-06-25 17:11</td>\n",
       "      <td>NaN</td>\n",
       "      <td>271.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>29</td>\n",
       "      <td>MIT Technology Review 2021年“十大突破性技术”解读  网络首发</td>\n",
       "      <td>祁海;张民;李俊涛;张小松;张强</td>\n",
       "      <td>中国科学基金</td>\n",
       "      <td>2021-06-25 17:07</td>\n",
       "      <td>NaN</td>\n",
       "      <td>140.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>30</td>\n",
       "      <td>基于区块链的联邦学习技术综述  网络首发</td>\n",
       "      <td>李凌霄;袁莎;金银玉</td>\n",
       "      <td>计算机应用研究</td>\n",
       "      <td>2021-06-25 16:23</td>\n",
       "      <td>NaN</td>\n",
       "      <td>365.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>31</td>\n",
       "      <td>竞技二打一游戏中同等牌力的研究  网络首发</td>\n",
       "      <td>李淑琴; 陈子鹏; 郑蓝舟; 孟坤</td>\n",
       "      <td>智能系统学报</td>\n",
       "      <td>2021-06-25 16:03</td>\n",
       "      <td>NaN</td>\n",
       "      <td>84.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>32</td>\n",
       "      <td>新信息技术对高等教育影响的演变及反思——基于2004-2021年《地平线报告》内容分析  网络首发</td>\n",
       "      <td>梁志星; 冯兴杰; 李佳; 杨珂</td>\n",
       "      <td>当代教育论坛</td>\n",
       "      <td>2021-06-25 16:03</td>\n",
       "      <td>NaN</td>\n",
       "      <td>199.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>33</td>\n",
       "      <td>机器人示教学习与技能泛化实验设计</td>\n",
       "      <td>占宏; 李娴; 杨辰光</td>\n",
       "      <td>实验技术与管理</td>\n",
       "      <td>2021-06-25 15:39</td>\n",
       "      <td>NaN</td>\n",
       "      <td>79.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>34</td>\n",
       "      <td>CoTransH: 科技文献知识图谱中语义关系预测的翻译模型  网络首发</td>\n",
       "      <td>陶玥; 余丽; 吴振新</td>\n",
       "      <td>情报理论与实践</td>\n",
       "      <td>2021-06-25 11:16</td>\n",
       "      <td>NaN</td>\n",
       "      <td>88.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>35</td>\n",
       "      <td>管道数字孪生体模型的构建及应用</td>\n",
       "      <td>陈斯迅;李在蓉;王禹钦;关红亮;高丽</td>\n",
       "      <td>油气储运</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>220.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>36</td>\n",
       "      <td>清华大学TH-Health研究室简介</td>\n",
       "      <td>NaN</td>\n",
       "      <td>针刺研究</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>18.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>36</th>\n",
       "      <td>37</td>\n",
       "      <td>大数据智能时代地图学课程内容改革探索</td>\n",
       "      <td>刘慧敏; 邓敏; 刘宝举; 陈杰</td>\n",
       "      <td>测绘通报</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>24.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>37</th>\n",
       "      <td>38</td>\n",
       "      <td>机器人智能化焊接技术发展综述及其在运载火箭贮箱中的应用</td>\n",
       "      <td>林尚扬;杨学勤;徐爱杰;陈华斌;林涛</td>\n",
       "      <td>上海航天(中英文)</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>24.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>38</th>\n",
       "      <td>39</td>\n",
       "      <td>智能博弈趋势下未来空天防御体系展望</td>\n",
       "      <td>王波兰</td>\n",
       "      <td>上海航天(中英文)</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>13.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>39</th>\n",
       "      <td>40</td>\n",
       "      <td>未来智能化网络化多功能卫星系统技术发展思考</td>\n",
       "      <td>陈占胜</td>\n",
       "      <td>上海航天(中英文)</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>9.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>40</th>\n",
       "      <td>41</td>\n",
       "      <td>人工智能方法在热模锻压力机故障诊断技术中的应用——评《实用模具设计与生产应用手册：挤压模与热锻模》</td>\n",
       "      <td>张诗雨</td>\n",
       "      <td>锻压技术</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>6.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>41</th>\n",
       "      <td>42</td>\n",
       "      <td>新型机械导航系统辅助穿刺初步实验研究</td>\n",
       "      <td>文艺; 李晓冰; 吴智群</td>\n",
       "      <td>介入放射学杂志</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>42</th>\n",
       "      <td>43</td>\n",
       "      <td>人机对抗智能技术最新进展及军事应用</td>\n",
       "      <td>聂凯; 曾科军; 孟庆海; 魏超</td>\n",
       "      <td>兵器装备工程学报</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>29.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>43</th>\n",
       "      <td>44</td>\n",
       "      <td>人工智能时代高校翻译技术实践环境建设研究</td>\n",
       "      <td>曹达钦; 戴钰涵</td>\n",
       "      <td>外语界</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>44</th>\n",
       "      <td>45</td>\n",
       "      <td>融合视觉显著性再检测的孪生网络无人机目标跟踪算法  网络首发</td>\n",
       "      <td>周士琪; 王耀南; 钟杭</td>\n",
       "      <td>智能系统学报</td>\n",
       "      <td>2021-06-23 15:11</td>\n",
       "      <td>NaN</td>\n",
       "      <td>217.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>45</th>\n",
       "      <td>46</td>\n",
       "      <td>军事智能化的瓶颈与关键问题研究  网络首发</td>\n",
       "      <td>刘伟</td>\n",
       "      <td>人民论坛·学术前沿</td>\n",
       "      <td>2021-06-23 14:04</td>\n",
       "      <td>NaN</td>\n",
       "      <td>80.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>46</th>\n",
       "      <td>47</td>\n",
       "      <td>思索·睿智:迷雾中的笃行要件——记第55次情报科学读书会</td>\n",
       "      <td>于伟; 苏鹏</td>\n",
       "      <td>情报理论与实践</td>\n",
       "      <td>2021-06-23</td>\n",
       "      <td>NaN</td>\n",
       "      <td>19.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>47</th>\n",
       "      <td>48</td>\n",
       "      <td>多智能体协作场景下基于强化学习值分解的计算卸载策略  网络首发</td>\n",
       "      <td>张鹏; 田辉; 赵鹏涛; 贺硕; 童一帆</td>\n",
       "      <td>通信学报</td>\n",
       "      <td>2021-06-22 16:50</td>\n",
       "      <td>NaN</td>\n",
       "      <td>160.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>48</th>\n",
       "      <td>49</td>\n",
       "      <td>人工智能范式的革命与通用智能理论的创生  网络首发</td>\n",
       "      <td>钟义信</td>\n",
       "      <td>智能系统学报</td>\n",
       "      <td>2021-06-22 15:09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>165.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49</th>\n",
       "      <td>50</td>\n",
       "      <td>基于人工智能算法的作业现场人员设备资质识别技术研究  网络首发</td>\n",
       "      <td>陈晓江; 龙震岳; 曾纪钧</td>\n",
       "      <td>电测与仪表</td>\n",
       "      <td>2021-06-22 10:38</td>\n",
       "      <td>NaN</td>\n",
       "      <td>192.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "    Unnamed: 0                                                 篇名  \\\n",
       "0            1    机器学习在档案管理中的应用与挑战——基于新南威尔士州档案馆机器学习实验的调查与启示  网络首发   \n",
       "1            2                                 关于智能化战争的基本认知  网络首发   \n",
       "2            3                         金融科技中人工智能技术典型事实与核心规律  网络首发   \n",
       "3            4                            卫星在轨故障案例与人工智能故障诊断  网络首发   \n",
       "4            5                            高等职业教育智能生态系统:内涵、结构与实践路径   \n",
       "5            6                     近20年在线学习环境研究评述——基于LDA和DTM的动态分析   \n",
       "6            7                                 教育人工智能场域下教师角色与行动取向   \n",
       "7            8                             智能财务人才培养与浙江大学的探索  网络首发   \n",
       "8            9                     机器学习在智能配用电领域的应用：北美工程实践概述  网络首发   \n",
       "9           10                        国际经贸协定中的源代码规则新发展及中国立场  网络首发   \n",
       "10          11                        人工智能赋能高校数据治理：逻辑、挑战与实践  网络首发   \n",
       "11          12                             嵌入式神经网络加速器及SoC芯片  网络首发   \n",
       "12          13                                    绿色理念下智慧零售创新发展路径   \n",
       "13          14                 数字经济视野下跨境电商企业的升级策略研究——评《跨境电商与国际物流》   \n",
       "14          15                       智能化金融监管：模型框架、边缘约束和实践策略  网络首发   \n",
       "15          16                             “智能+”时代的现代文化产业体系：挑战与重塑   \n",
       "16          17                    人工智能在胸部创伤肋骨骨折CT诊断中应用的初步研究  网络首发   \n",
       "17          18                             人工智能技术在火电行业的应用探讨  网络首发   \n",
       "18          19                           基于切换输出机制的超短期风电功率预测  网络首发   \n",
       "19          20                        DCN:双通道密集哈达玛卷积的画质评价网络  网络首发   \n",
       "20          21                                 智能交通管理系统发展趋势  网络首发   \n",
       "21          22              人工智能写作背景下作者主体性的消解与重构——以陈楸帆人机交互写作实验为中心   \n",
       "22          23                           空气源热泵除霜控制方法研究现状及展望  网络首发   \n",
       "23          24                         面向机器人自主分割的肉品识别分类系统实现  网络首发   \n",
       "24          25                              AI辅助头颈CTA在诊断颅内动脉瘤中的应用   \n",
       "25          26                     人工智能模型预测输尿管结石自然排出的多中心临床试验的验证研究   \n",
       "26          27                               城市暴雨内涝综述：特征、机理、数据与方法   \n",
       "27          28                           基于计算机视觉的织物光泽测试方法研究  网络首发   \n",
       "28          29       MIT Technology Review 2021年“十大突破性技术”解读  网络首发   \n",
       "29          30                               基于区块链的联邦学习技术综述  网络首发   \n",
       "30          31                              竞技二打一游戏中同等牌力的研究  网络首发   \n",
       "31          32  新信息技术对高等教育影响的演变及反思——基于2004-2021年《地平线报告》内容分析  网络首发   \n",
       "32          33                                   机器人示教学习与技能泛化实验设计   \n",
       "33          34               CoTransH: 科技文献知识图谱中语义关系预测的翻译模型  网络首发   \n",
       "34          35                                    管道数字孪生体模型的构建及应用   \n",
       "35          36                                 清华大学TH-Health研究室简介   \n",
       "36          37                                 大数据智能时代地图学课程内容改革探索   \n",
       "37          38                        机器人智能化焊接技术发展综述及其在运载火箭贮箱中的应用   \n",
       "38          39                                  智能博弈趋势下未来空天防御体系展望   \n",
       "39          40                              未来智能化网络化多功能卫星系统技术发展思考   \n",
       "40          41  人工智能方法在热模锻压力机故障诊断技术中的应用——评《实用模具设计与生产应用手册：挤压模与热锻模》   \n",
       "41          42                                 新型机械导航系统辅助穿刺初步实验研究   \n",
       "42          43                                  人机对抗智能技术最新进展及军事应用   \n",
       "43          44                               人工智能时代高校翻译技术实践环境建设研究   \n",
       "44          45                     融合视觉显著性再检测的孪生网络无人机目标跟踪算法  网络首发   \n",
       "45          46                              军事智能化的瓶颈与关键问题研究  网络首发   \n",
       "46          47                       思索·睿智:迷雾中的笃行要件——记第55次情报科学读书会   \n",
       "47          48                    多智能体协作场景下基于强化学习值分解的计算卸载策略  网络首发   \n",
       "48          49                          人工智能范式的革命与通用智能理论的创生  网络首发   \n",
       "49          50                    基于人工智能算法的作业现场人员设备资质识别技术研究  网络首发   \n",
       "\n",
       "                         作者               刊名              发表时间  被引     下载  操作  \n",
       "0                  代林序; 张玉洁            档案与建设  2021-07-02 16:16 NaN    NaN  下载  \n",
       "1                        郭明        人民论坛·学术前沿  2021-07-02 15:49 NaN    NaN  下载  \n",
       "2             陈增敬; 严晓东; 冯新伟           中国科学基金  2021-07-02 11:39 NaN    NaN  下载  \n",
       "3        王亚坤;杨凯飞;张婕;郭莉芳;韩笑冬         中国空间科学技术  2021-07-02 08:49 NaN    NaN  下载  \n",
       "4                        徐晔           中国远程教育        2021-07-02 NaN    NaN  下载  \n",
       "5                  牛晓杰; 郑勤华           中国远程教育        2021-07-02 NaN    NaN  下载  \n",
       "6             赵磊磊; 马玉菲; 代蕊华           中国远程教育        2021-07-02 NaN    NaN  下载  \n",
       "7                    陈俊; 董望             财会月刊  2021-07-01 15:42 NaN    NaN  下载  \n",
       "8    李亦言; 胡荣兴; 宋立冬; 贾乾罡; 陆宁          电力系统自动化  2021-07-01 09:50 NaN    NaN  下载  \n",
       "9                       鄢雨虹          武大国际法评论  2021-07-01 09:16 NaN    NaN  下载  \n",
       "10                      赵磊磊           重庆高教研究  2021-06-30 14:14 NaN  114.0  下载  \n",
       "11             易冬柏; 陈恒; 何乐年           仪器仪表学报  2021-06-30 10:09 NaN   59.0  下载  \n",
       "12                       翟璇           商业经济研究        2021-06-30 NaN    6.0  下载  \n",
       "13                      单浩耘           商业经济研究        2021-06-30 NaN   15.0  下载  \n",
       "14                      乔宇锋             南方金融  2021-06-29 17:04 NaN  105.0  下载  \n",
       "15                 解学芳; 雷文宣  深圳大学学报(人文社会科学版)  2021-06-29 15:45 NaN   65.0  下载  \n",
       "16        刘想;谢辉辉;许玉峰;陶晓峰;柳林    上海交通大学学报(医学版)  2021-06-29 14:47 NaN   38.0  下载  \n",
       "17    华志刚; 范佳卿; 郭荣; 汪勇; 吴潇翔             中国电力  2021-06-29 11:10 NaN  127.0  下载  \n",
       "18             杨茂; 许传宇; 王凯旋            高电压技术  2021-06-29 11:02 NaN   23.0  下载  \n",
       "19        杨晓东; 韩振奇; 刘立庄; 赵丹         计算机工程与应用  2021-06-29 09:20 NaN   26.0  下载  \n",
       "20                 李瑞敏; 王长君    清华大学学报(自然科学版)  2021-06-29 08:59 NaN   94.0  下载  \n",
       "21                      周建琼             当代文坛        2021-06-29 NaN   28.0  下载  \n",
       "22  王沣浩; 马龙霞; 王志华; 楼业春; 刘孜璇             制冷学报  2021-06-28 10:21 NaN   60.0  下载  \n",
       "23        马欢; 冀晶晶; 刘佳豪; 刘雨婷             图学学报  2021-06-28 08:48 NaN  150.0  下载  \n",
       "24         邓昊;韦鑫;曹闻挺;艾光勇;余菡         第三军医大学学报        2021-06-28 NaN    6.0  下载  \n",
       "25     曾凯; 王新敏; 倪钊; 王勤章; 李强           中国全科医学        2021-06-28 NaN   18.0  下载  \n",
       "26             黄华兵; 王先伟; 柳林           地理科学进展        2021-06-28 NaN    NaN  下载  \n",
       "27             张建新; 黄钢; 李消晋               丝绸  2021-06-25 17:11 NaN  271.0  下载  \n",
       "28         祁海;张民;李俊涛;张小松;张强           中国科学基金  2021-06-25 17:07 NaN  140.0  下载  \n",
       "29               李凌霄;袁莎;金银玉          计算机应用研究  2021-06-25 16:23 NaN  365.0  下载  \n",
       "30        李淑琴; 陈子鹏; 郑蓝舟; 孟坤           智能系统学报  2021-06-25 16:03 NaN   84.0  下载  \n",
       "31         梁志星; 冯兴杰; 李佳; 杨珂           当代教育论坛  2021-06-25 16:03 NaN  199.0  下载  \n",
       "32              占宏; 李娴; 杨辰光          实验技术与管理  2021-06-25 15:39 NaN   79.0  下载  \n",
       "33              陶玥; 余丽; 吴振新          情报理论与实践  2021-06-25 11:16 NaN   88.0  下载  \n",
       "34       陈斯迅;李在蓉;王禹钦;关红亮;高丽             油气储运        2021-06-25 NaN  220.0  下载  \n",
       "35                      NaN             针刺研究        2021-06-25 NaN   18.0  下载  \n",
       "36         刘慧敏; 邓敏; 刘宝举; 陈杰             测绘通报        2021-06-25 NaN   24.0  下载  \n",
       "37       林尚扬;杨学勤;徐爱杰;陈华斌;林涛        上海航天(中英文)        2021-06-25 NaN   24.0  下载  \n",
       "38                      王波兰        上海航天(中英文)        2021-06-25 NaN   13.0  下载  \n",
       "39                      陈占胜        上海航天(中英文)        2021-06-25 NaN    9.0  下载  \n",
       "40                      张诗雨             锻压技术        2021-06-25 NaN    6.0  下载  \n",
       "41             文艺; 李晓冰; 吴智群          介入放射学杂志        2021-06-25 NaN    1.0  下载  \n",
       "42         聂凯; 曾科军; 孟庆海; 魏超         兵器装备工程学报        2021-06-25 NaN   29.0  下载  \n",
       "43                 曹达钦; 戴钰涵              外语界        2021-06-25 NaN    NaN  下载  \n",
       "44             周士琪; 王耀南; 钟杭           智能系统学报  2021-06-23 15:11 NaN  217.0  下载  \n",
       "45                       刘伟        人民论坛·学术前沿  2021-06-23 14:04 NaN   80.0  下载  \n",
       "46                   于伟; 苏鹏          情报理论与实践        2021-06-23 NaN   19.0  下载  \n",
       "47     张鹏; 田辉; 赵鹏涛; 贺硕; 童一帆             通信学报  2021-06-22 16:50 NaN  160.0  下载  \n",
       "48                      钟义信           智能系统学报  2021-06-22 15:09 NaN  165.0  下载  \n",
       "49            陈晓江; 龙震岳; 曾纪钧            电测与仪表  2021-06-22 10:38 NaN  192.0  下载  "
      ]
     },
     "execution_count": 22,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "element=driver.find_element_by_id('gridTable')\n",
    "页面_表格_html=element.get_attribute('innerHTML')\n",
    "pd.read_html(页面_表格_html)[0]"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 详细页链接"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 23,
   "metadata": {},
   "outputs": [],
   "source": [
    "import re\n",
    "from lxml.html import fromstring"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "metadata": {},
   "outputs": [],
   "source": [
    "html = driver.page_source\n",
    "root = fromstring(html)\n",
    "href = [x for x in root.xpath('.//*[@id=\"gridTable\"]/table/tbody/tr/td[2]/a/@href')]\n",
    "\n",
    "def correct(href):\n",
    "    DbCode = re.findall(\"DbCode=(.*?)&\",href)[0]\n",
    "    dbname = re.findall(\"dbname=(.*?)&\",href)[0]\n",
    "    filename = re.findall(\"filename=(.*?)&\",href)[0]\n",
    "    href = f\"https://kns.cnki.net/kcms/detail/detail.aspx?dbcode={DbCode}&dbname={dbname}&filename={filename}\"\n",
    "    return href"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 25,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "      <th>详细页链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>机器学习在档案管理中的应用与挑战——基于新南威尔士州档案馆机器学习实验的调查与启示  网络首发</td>\n",
       "      <td>代林序; 张玉洁</td>\n",
       "      <td>档案与建设</td>\n",
       "      <td>2021-07-02 16:16</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>关于智能化战争的基本认知  网络首发</td>\n",
       "      <td>郭明</td>\n",
       "      <td>人民论坛·学术前沿</td>\n",
       "      <td>2021-07-02 15:49</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3</td>\n",
       "      <td>金融科技中人工智能技术典型事实与核心规律  网络首发</td>\n",
       "      <td>陈增敬; 严晓东; 冯新伟</td>\n",
       "      <td>中国科学基金</td>\n",
       "      <td>2021-07-02 11:39</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4</td>\n",
       "      <td>卫星在轨故障案例与人工智能故障诊断  网络首发</td>\n",
       "      <td>王亚坤;杨凯飞;张婕;郭莉芳;韩笑冬</td>\n",
       "      <td>中国空间科学技术</td>\n",
       "      <td>2021-07-02 08:49</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>5</td>\n",
       "      <td>高等职业教育智能生态系统:内涵、结构与实践路径</td>\n",
       "      <td>徐晔</td>\n",
       "      <td>中国远程教育</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>6</td>\n",
       "      <td>近20年在线学习环境研究评述——基于LDA和DTM的动态分析</td>\n",
       "      <td>牛晓杰; 郑勤华</td>\n",
       "      <td>中国远程教育</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>7</td>\n",
       "      <td>教育人工智能场域下教师角色与行动取向</td>\n",
       "      <td>赵磊磊; 马玉菲; 代蕊华</td>\n",
       "      <td>中国远程教育</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>8</td>\n",
       "      <td>智能财务人才培养与浙江大学的探索  网络首发</td>\n",
       "      <td>陈俊; 董望</td>\n",
       "      <td>财会月刊</td>\n",
       "      <td>2021-07-01 15:42</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>9</td>\n",
       "      <td>机器学习在智能配用电领域的应用：北美工程实践概述  网络首发</td>\n",
       "      <td>李亦言; 胡荣兴; 宋立冬; 贾乾罡; 陆宁</td>\n",
       "      <td>电力系统自动化</td>\n",
       "      <td>2021-07-01 09:50</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>10</td>\n",
       "      <td>国际经贸协定中的源代码规则新发展及中国立场  网络首发</td>\n",
       "      <td>鄢雨虹</td>\n",
       "      <td>武大国际法评论</td>\n",
       "      <td>2021-07-01 09:16</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>11</td>\n",
       "      <td>人工智能赋能高校数据治理：逻辑、挑战与实践  网络首发</td>\n",
       "      <td>赵磊磊</td>\n",
       "      <td>重庆高教研究</td>\n",
       "      <td>2021-06-30 14:14</td>\n",
       "      <td>NaN</td>\n",
       "      <td>114.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>12</td>\n",
       "      <td>嵌入式神经网络加速器及SoC芯片  网络首发</td>\n",
       "      <td>易冬柏; 陈恒; 何乐年</td>\n",
       "      <td>仪器仪表学报</td>\n",
       "      <td>2021-06-30 10:09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>59.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>13</td>\n",
       "      <td>绿色理念下智慧零售创新发展路径</td>\n",
       "      <td>翟璇</td>\n",
       "      <td>商业经济研究</td>\n",
       "      <td>2021-06-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>6.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>14</td>\n",
       "      <td>数字经济视野下跨境电商企业的升级策略研究——评《跨境电商与国际物流》</td>\n",
       "      <td>单浩耘</td>\n",
       "      <td>商业经济研究</td>\n",
       "      <td>2021-06-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>15.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>15</td>\n",
       "      <td>智能化金融监管：模型框架、边缘约束和实践策略  网络首发</td>\n",
       "      <td>乔宇锋</td>\n",
       "      <td>南方金融</td>\n",
       "      <td>2021-06-29 17:04</td>\n",
       "      <td>NaN</td>\n",
       "      <td>105.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>16</td>\n",
       "      <td>“智能+”时代的现代文化产业体系：挑战与重塑</td>\n",
       "      <td>解学芳; 雷文宣</td>\n",
       "      <td>深圳大学学报(人文社会科学版)</td>\n",
       "      <td>2021-06-29 15:45</td>\n",
       "      <td>NaN</td>\n",
       "      <td>65.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>17</td>\n",
       "      <td>人工智能在胸部创伤肋骨骨折CT诊断中应用的初步研究  网络首发</td>\n",
       "      <td>刘想;谢辉辉;许玉峰;陶晓峰;柳林</td>\n",
       "      <td>上海交通大学学报(医学版)</td>\n",
       "      <td>2021-06-29 14:47</td>\n",
       "      <td>NaN</td>\n",
       "      <td>38.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>18</td>\n",
       "      <td>人工智能技术在火电行业的应用探讨  网络首发</td>\n",
       "      <td>华志刚; 范佳卿; 郭荣; 汪勇; 吴潇翔</td>\n",
       "      <td>中国电力</td>\n",
       "      <td>2021-06-29 11:10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>127.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>19</td>\n",
       "      <td>基于切换输出机制的超短期风电功率预测  网络首发</td>\n",
       "      <td>杨茂; 许传宇; 王凯旋</td>\n",
       "      <td>高电压技术</td>\n",
       "      <td>2021-06-29 11:02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>23.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>20</td>\n",
       "      <td>DCN:双通道密集哈达玛卷积的画质评价网络  网络首发</td>\n",
       "      <td>杨晓东; 韩振奇; 刘立庄; 赵丹</td>\n",
       "      <td>计算机工程与应用</td>\n",
       "      <td>2021-06-29 09:20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>26.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>21</td>\n",
       "      <td>智能交通管理系统发展趋势  网络首发</td>\n",
       "      <td>李瑞敏; 王长君</td>\n",
       "      <td>清华大学学报(自然科学版)</td>\n",
       "      <td>2021-06-29 08:59</td>\n",
       "      <td>NaN</td>\n",
       "      <td>94.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>22</td>\n",
       "      <td>人工智能写作背景下作者主体性的消解与重构——以陈楸帆人机交互写作实验为中心</td>\n",
       "      <td>周建琼</td>\n",
       "      <td>当代文坛</td>\n",
       "      <td>2021-06-29</td>\n",
       "      <td>NaN</td>\n",
       "      <td>28.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>23</td>\n",
       "      <td>空气源热泵除霜控制方法研究现状及展望  网络首发</td>\n",
       "      <td>王沣浩; 马龙霞; 王志华; 楼业春; 刘孜璇</td>\n",
       "      <td>制冷学报</td>\n",
       "      <td>2021-06-28 10:21</td>\n",
       "      <td>NaN</td>\n",
       "      <td>60.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>24</td>\n",
       "      <td>面向机器人自主分割的肉品识别分类系统实现  网络首发</td>\n",
       "      <td>马欢; 冀晶晶; 刘佳豪; 刘雨婷</td>\n",
       "      <td>图学学报</td>\n",
       "      <td>2021-06-28 08:48</td>\n",
       "      <td>NaN</td>\n",
       "      <td>150.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>25</td>\n",
       "      <td>AI辅助头颈CTA在诊断颅内动脉瘤中的应用</td>\n",
       "      <td>邓昊;韦鑫;曹闻挺;艾光勇;余菡</td>\n",
       "      <td>第三军医大学学报</td>\n",
       "      <td>2021-06-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>6.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>26</td>\n",
       "      <td>人工智能模型预测输尿管结石自然排出的多中心临床试验的验证研究</td>\n",
       "      <td>曾凯; 王新敏; 倪钊; 王勤章; 李强</td>\n",
       "      <td>中国全科医学</td>\n",
       "      <td>2021-06-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>18.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>27</td>\n",
       "      <td>城市暴雨内涝综述：特征、机理、数据与方法</td>\n",
       "      <td>黄华兵; 王先伟; 柳林</td>\n",
       "      <td>地理科学进展</td>\n",
       "      <td>2021-06-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>28</td>\n",
       "      <td>基于计算机视觉的织物光泽测试方法研究  网络首发</td>\n",
       "      <td>张建新; 黄钢; 李消晋</td>\n",
       "      <td>丝绸</td>\n",
       "      <td>2021-06-25 17:11</td>\n",
       "      <td>NaN</td>\n",
       "      <td>271.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>29</td>\n",
       "      <td>MIT Technology Review 2021年“十大突破性技术”解读  网络首发</td>\n",
       "      <td>祁海;张民;李俊涛;张小松;张强</td>\n",
       "      <td>中国科学基金</td>\n",
       "      <td>2021-06-25 17:07</td>\n",
       "      <td>NaN</td>\n",
       "      <td>140.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>30</td>\n",
       "      <td>基于区块链的联邦学习技术综述  网络首发</td>\n",
       "      <td>李凌霄;袁莎;金银玉</td>\n",
       "      <td>计算机应用研究</td>\n",
       "      <td>2021-06-25 16:23</td>\n",
       "      <td>NaN</td>\n",
       "      <td>365.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>31</td>\n",
       "      <td>竞技二打一游戏中同等牌力的研究  网络首发</td>\n",
       "      <td>李淑琴; 陈子鹏; 郑蓝舟; 孟坤</td>\n",
       "      <td>智能系统学报</td>\n",
       "      <td>2021-06-25 16:03</td>\n",
       "      <td>NaN</td>\n",
       "      <td>84.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>32</td>\n",
       "      <td>新信息技术对高等教育影响的演变及反思——基于2004-2021年《地平线报告》内容分析  网络首发</td>\n",
       "      <td>梁志星; 冯兴杰; 李佳; 杨珂</td>\n",
       "      <td>当代教育论坛</td>\n",
       "      <td>2021-06-25 16:03</td>\n",
       "      <td>NaN</td>\n",
       "      <td>199.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>33</td>\n",
       "      <td>机器人示教学习与技能泛化实验设计</td>\n",
       "      <td>占宏; 李娴; 杨辰光</td>\n",
       "      <td>实验技术与管理</td>\n",
       "      <td>2021-06-25 15:39</td>\n",
       "      <td>NaN</td>\n",
       "      <td>79.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>34</td>\n",
       "      <td>CoTransH: 科技文献知识图谱中语义关系预测的翻译模型  网络首发</td>\n",
       "      <td>陶玥; 余丽; 吴振新</td>\n",
       "      <td>情报理论与实践</td>\n",
       "      <td>2021-06-25 11:16</td>\n",
       "      <td>NaN</td>\n",
       "      <td>88.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>35</td>\n",
       "      <td>管道数字孪生体模型的构建及应用</td>\n",
       "      <td>陈斯迅;李在蓉;王禹钦;关红亮;高丽</td>\n",
       "      <td>油气储运</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>220.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>36</td>\n",
       "      <td>清华大学TH-Health研究室简介</td>\n",
       "      <td>NaN</td>\n",
       "      <td>针刺研究</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>18.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>36</th>\n",
       "      <td>37</td>\n",
       "      <td>大数据智能时代地图学课程内容改革探索</td>\n",
       "      <td>刘慧敏; 邓敏; 刘宝举; 陈杰</td>\n",
       "      <td>测绘通报</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>24.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>37</th>\n",
       "      <td>38</td>\n",
       "      <td>机器人智能化焊接技术发展综述及其在运载火箭贮箱中的应用</td>\n",
       "      <td>林尚扬;杨学勤;徐爱杰;陈华斌;林涛</td>\n",
       "      <td>上海航天(中英文)</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>24.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>38</th>\n",
       "      <td>39</td>\n",
       "      <td>智能博弈趋势下未来空天防御体系展望</td>\n",
       "      <td>王波兰</td>\n",
       "      <td>上海航天(中英文)</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>13.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>39</th>\n",
       "      <td>40</td>\n",
       "      <td>未来智能化网络化多功能卫星系统技术发展思考</td>\n",
       "      <td>陈占胜</td>\n",
       "      <td>上海航天(中英文)</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>9.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>40</th>\n",
       "      <td>41</td>\n",
       "      <td>人工智能方法在热模锻压力机故障诊断技术中的应用——评《实用模具设计与生产应用手册：挤压模与热锻模》</td>\n",
       "      <td>张诗雨</td>\n",
       "      <td>锻压技术</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>6.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>41</th>\n",
       "      <td>42</td>\n",
       "      <td>新型机械导航系统辅助穿刺初步实验研究</td>\n",
       "      <td>文艺; 李晓冰; 吴智群</td>\n",
       "      <td>介入放射学杂志</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>42</th>\n",
       "      <td>43</td>\n",
       "      <td>人机对抗智能技术最新进展及军事应用</td>\n",
       "      <td>聂凯; 曾科军; 孟庆海; 魏超</td>\n",
       "      <td>兵器装备工程学报</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>29.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>43</th>\n",
       "      <td>44</td>\n",
       "      <td>人工智能时代高校翻译技术实践环境建设研究</td>\n",
       "      <td>曹达钦; 戴钰涵</td>\n",
       "      <td>外语界</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>44</th>\n",
       "      <td>45</td>\n",
       "      <td>融合视觉显著性再检测的孪生网络无人机目标跟踪算法  网络首发</td>\n",
       "      <td>周士琪; 王耀南; 钟杭</td>\n",
       "      <td>智能系统学报</td>\n",
       "      <td>2021-06-23 15:11</td>\n",
       "      <td>NaN</td>\n",
       "      <td>217.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>45</th>\n",
       "      <td>46</td>\n",
       "      <td>军事智能化的瓶颈与关键问题研究  网络首发</td>\n",
       "      <td>刘伟</td>\n",
       "      <td>人民论坛·学术前沿</td>\n",
       "      <td>2021-06-23 14:04</td>\n",
       "      <td>NaN</td>\n",
       "      <td>80.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>46</th>\n",
       "      <td>47</td>\n",
       "      <td>思索·睿智:迷雾中的笃行要件——记第55次情报科学读书会</td>\n",
       "      <td>于伟; 苏鹏</td>\n",
       "      <td>情报理论与实践</td>\n",
       "      <td>2021-06-23</td>\n",
       "      <td>NaN</td>\n",
       "      <td>19.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>47</th>\n",
       "      <td>48</td>\n",
       "      <td>多智能体协作场景下基于强化学习值分解的计算卸载策略  网络首发</td>\n",
       "      <td>张鹏; 田辉; 赵鹏涛; 贺硕; 童一帆</td>\n",
       "      <td>通信学报</td>\n",
       "      <td>2021-06-22 16:50</td>\n",
       "      <td>NaN</td>\n",
       "      <td>160.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>48</th>\n",
       "      <td>49</td>\n",
       "      <td>人工智能范式的革命与通用智能理论的创生  网络首发</td>\n",
       "      <td>钟义信</td>\n",
       "      <td>智能系统学报</td>\n",
       "      <td>2021-06-22 15:09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>165.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49</th>\n",
       "      <td>50</td>\n",
       "      <td>基于人工智能算法的作业现场人员设备资质识别技术研究  网络首发</td>\n",
       "      <td>陈晓江; 龙震岳; 曾纪钧</td>\n",
       "      <td>电测与仪表</td>\n",
       "      <td>2021-06-22 10:38</td>\n",
       "      <td>NaN</td>\n",
       "      <td>192.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "    Unnamed: 0                                                 篇名  \\\n",
       "0            1    机器学习在档案管理中的应用与挑战——基于新南威尔士州档案馆机器学习实验的调查与启示  网络首发   \n",
       "1            2                                 关于智能化战争的基本认知  网络首发   \n",
       "2            3                         金融科技中人工智能技术典型事实与核心规律  网络首发   \n",
       "3            4                            卫星在轨故障案例与人工智能故障诊断  网络首发   \n",
       "4            5                            高等职业教育智能生态系统:内涵、结构与实践路径   \n",
       "5            6                     近20年在线学习环境研究评述——基于LDA和DTM的动态分析   \n",
       "6            7                                 教育人工智能场域下教师角色与行动取向   \n",
       "7            8                             智能财务人才培养与浙江大学的探索  网络首发   \n",
       "8            9                     机器学习在智能配用电领域的应用：北美工程实践概述  网络首发   \n",
       "9           10                        国际经贸协定中的源代码规则新发展及中国立场  网络首发   \n",
       "10          11                        人工智能赋能高校数据治理：逻辑、挑战与实践  网络首发   \n",
       "11          12                             嵌入式神经网络加速器及SoC芯片  网络首发   \n",
       "12          13                                    绿色理念下智慧零售创新发展路径   \n",
       "13          14                 数字经济视野下跨境电商企业的升级策略研究——评《跨境电商与国际物流》   \n",
       "14          15                       智能化金融监管：模型框架、边缘约束和实践策略  网络首发   \n",
       "15          16                             “智能+”时代的现代文化产业体系：挑战与重塑   \n",
       "16          17                    人工智能在胸部创伤肋骨骨折CT诊断中应用的初步研究  网络首发   \n",
       "17          18                             人工智能技术在火电行业的应用探讨  网络首发   \n",
       "18          19                           基于切换输出机制的超短期风电功率预测  网络首发   \n",
       "19          20                        DCN:双通道密集哈达玛卷积的画质评价网络  网络首发   \n",
       "20          21                                 智能交通管理系统发展趋势  网络首发   \n",
       "21          22              人工智能写作背景下作者主体性的消解与重构——以陈楸帆人机交互写作实验为中心   \n",
       "22          23                           空气源热泵除霜控制方法研究现状及展望  网络首发   \n",
       "23          24                         面向机器人自主分割的肉品识别分类系统实现  网络首发   \n",
       "24          25                              AI辅助头颈CTA在诊断颅内动脉瘤中的应用   \n",
       "25          26                     人工智能模型预测输尿管结石自然排出的多中心临床试验的验证研究   \n",
       "26          27                               城市暴雨内涝综述：特征、机理、数据与方法   \n",
       "27          28                           基于计算机视觉的织物光泽测试方法研究  网络首发   \n",
       "28          29       MIT Technology Review 2021年“十大突破性技术”解读  网络首发   \n",
       "29          30                               基于区块链的联邦学习技术综述  网络首发   \n",
       "30          31                              竞技二打一游戏中同等牌力的研究  网络首发   \n",
       "31          32  新信息技术对高等教育影响的演变及反思——基于2004-2021年《地平线报告》内容分析  网络首发   \n",
       "32          33                                   机器人示教学习与技能泛化实验设计   \n",
       "33          34               CoTransH: 科技文献知识图谱中语义关系预测的翻译模型  网络首发   \n",
       "34          35                                    管道数字孪生体模型的构建及应用   \n",
       "35          36                                 清华大学TH-Health研究室简介   \n",
       "36          37                                 大数据智能时代地图学课程内容改革探索   \n",
       "37          38                        机器人智能化焊接技术发展综述及其在运载火箭贮箱中的应用   \n",
       "38          39                                  智能博弈趋势下未来空天防御体系展望   \n",
       "39          40                              未来智能化网络化多功能卫星系统技术发展思考   \n",
       "40          41  人工智能方法在热模锻压力机故障诊断技术中的应用——评《实用模具设计与生产应用手册：挤压模与热锻模》   \n",
       "41          42                                 新型机械导航系统辅助穿刺初步实验研究   \n",
       "42          43                                  人机对抗智能技术最新进展及军事应用   \n",
       "43          44                               人工智能时代高校翻译技术实践环境建设研究   \n",
       "44          45                     融合视觉显著性再检测的孪生网络无人机目标跟踪算法  网络首发   \n",
       "45          46                              军事智能化的瓶颈与关键问题研究  网络首发   \n",
       "46          47                       思索·睿智:迷雾中的笃行要件——记第55次情报科学读书会   \n",
       "47          48                    多智能体协作场景下基于强化学习值分解的计算卸载策略  网络首发   \n",
       "48          49                          人工智能范式的革命与通用智能理论的创生  网络首发   \n",
       "49          50                    基于人工智能算法的作业现场人员设备资质识别技术研究  网络首发   \n",
       "\n",
       "                         作者               刊名              发表时间  被引     下载  操作  \\\n",
       "0                  代林序; 张玉洁            档案与建设  2021-07-02 16:16 NaN    NaN  下载   \n",
       "1                        郭明        人民论坛·学术前沿  2021-07-02 15:49 NaN    NaN  下载   \n",
       "2             陈增敬; 严晓东; 冯新伟           中国科学基金  2021-07-02 11:39 NaN    NaN  下载   \n",
       "3        王亚坤;杨凯飞;张婕;郭莉芳;韩笑冬         中国空间科学技术  2021-07-02 08:49 NaN    NaN  下载   \n",
       "4                        徐晔           中国远程教育        2021-07-02 NaN    NaN  下载   \n",
       "5                  牛晓杰; 郑勤华           中国远程教育        2021-07-02 NaN    NaN  下载   \n",
       "6             赵磊磊; 马玉菲; 代蕊华           中国远程教育        2021-07-02 NaN    NaN  下载   \n",
       "7                    陈俊; 董望             财会月刊  2021-07-01 15:42 NaN    NaN  下载   \n",
       "8    李亦言; 胡荣兴; 宋立冬; 贾乾罡; 陆宁          电力系统自动化  2021-07-01 09:50 NaN    NaN  下载   \n",
       "9                       鄢雨虹          武大国际法评论  2021-07-01 09:16 NaN    NaN  下载   \n",
       "10                      赵磊磊           重庆高教研究  2021-06-30 14:14 NaN  114.0  下载   \n",
       "11             易冬柏; 陈恒; 何乐年           仪器仪表学报  2021-06-30 10:09 NaN   59.0  下载   \n",
       "12                       翟璇           商业经济研究        2021-06-30 NaN    6.0  下载   \n",
       "13                      单浩耘           商业经济研究        2021-06-30 NaN   15.0  下载   \n",
       "14                      乔宇锋             南方金融  2021-06-29 17:04 NaN  105.0  下载   \n",
       "15                 解学芳; 雷文宣  深圳大学学报(人文社会科学版)  2021-06-29 15:45 NaN   65.0  下载   \n",
       "16        刘想;谢辉辉;许玉峰;陶晓峰;柳林    上海交通大学学报(医学版)  2021-06-29 14:47 NaN   38.0  下载   \n",
       "17    华志刚; 范佳卿; 郭荣; 汪勇; 吴潇翔             中国电力  2021-06-29 11:10 NaN  127.0  下载   \n",
       "18             杨茂; 许传宇; 王凯旋            高电压技术  2021-06-29 11:02 NaN   23.0  下载   \n",
       "19        杨晓东; 韩振奇; 刘立庄; 赵丹         计算机工程与应用  2021-06-29 09:20 NaN   26.0  下载   \n",
       "20                 李瑞敏; 王长君    清华大学学报(自然科学版)  2021-06-29 08:59 NaN   94.0  下载   \n",
       "21                      周建琼             当代文坛        2021-06-29 NaN   28.0  下载   \n",
       "22  王沣浩; 马龙霞; 王志华; 楼业春; 刘孜璇             制冷学报  2021-06-28 10:21 NaN   60.0  下载   \n",
       "23        马欢; 冀晶晶; 刘佳豪; 刘雨婷             图学学报  2021-06-28 08:48 NaN  150.0  下载   \n",
       "24         邓昊;韦鑫;曹闻挺;艾光勇;余菡         第三军医大学学报        2021-06-28 NaN    6.0  下载   \n",
       "25     曾凯; 王新敏; 倪钊; 王勤章; 李强           中国全科医学        2021-06-28 NaN   18.0  下载   \n",
       "26             黄华兵; 王先伟; 柳林           地理科学进展        2021-06-28 NaN    NaN  下载   \n",
       "27             张建新; 黄钢; 李消晋               丝绸  2021-06-25 17:11 NaN  271.0  下载   \n",
       "28         祁海;张民;李俊涛;张小松;张强           中国科学基金  2021-06-25 17:07 NaN  140.0  下载   \n",
       "29               李凌霄;袁莎;金银玉          计算机应用研究  2021-06-25 16:23 NaN  365.0  下载   \n",
       "30        李淑琴; 陈子鹏; 郑蓝舟; 孟坤           智能系统学报  2021-06-25 16:03 NaN   84.0  下载   \n",
       "31         梁志星; 冯兴杰; 李佳; 杨珂           当代教育论坛  2021-06-25 16:03 NaN  199.0  下载   \n",
       "32              占宏; 李娴; 杨辰光          实验技术与管理  2021-06-25 15:39 NaN   79.0  下载   \n",
       "33              陶玥; 余丽; 吴振新          情报理论与实践  2021-06-25 11:16 NaN   88.0  下载   \n",
       "34       陈斯迅;李在蓉;王禹钦;关红亮;高丽             油气储运        2021-06-25 NaN  220.0  下载   \n",
       "35                      NaN             针刺研究        2021-06-25 NaN   18.0  下载   \n",
       "36         刘慧敏; 邓敏; 刘宝举; 陈杰             测绘通报        2021-06-25 NaN   24.0  下载   \n",
       "37       林尚扬;杨学勤;徐爱杰;陈华斌;林涛        上海航天(中英文)        2021-06-25 NaN   24.0  下载   \n",
       "38                      王波兰        上海航天(中英文)        2021-06-25 NaN   13.0  下载   \n",
       "39                      陈占胜        上海航天(中英文)        2021-06-25 NaN    9.0  下载   \n",
       "40                      张诗雨             锻压技术        2021-06-25 NaN    6.0  下载   \n",
       "41             文艺; 李晓冰; 吴智群          介入放射学杂志        2021-06-25 NaN    1.0  下载   \n",
       "42         聂凯; 曾科军; 孟庆海; 魏超         兵器装备工程学报        2021-06-25 NaN   29.0  下载   \n",
       "43                 曹达钦; 戴钰涵              外语界        2021-06-25 NaN    NaN  下载   \n",
       "44             周士琪; 王耀南; 钟杭           智能系统学报  2021-06-23 15:11 NaN  217.0  下载   \n",
       "45                       刘伟        人民论坛·学术前沿  2021-06-23 14:04 NaN   80.0  下载   \n",
       "46                   于伟; 苏鹏          情报理论与实践        2021-06-23 NaN   19.0  下载   \n",
       "47     张鹏; 田辉; 赵鹏涛; 贺硕; 童一帆             通信学报  2021-06-22 16:50 NaN  160.0  下载   \n",
       "48                      钟义信           智能系统学报  2021-06-22 15:09 NaN  165.0  下载   \n",
       "49            陈晓江; 龙震岳; 曾纪钧            电测与仪表  2021-06-22 10:38 NaN  192.0  下载   \n",
       "\n",
       "                                                详细页链接  \n",
       "0   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "1   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "2   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "3   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "4   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "5   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "6   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "7   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "8   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "9   https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "10  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "11  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "12  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "13  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "14  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "15  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "16  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "17  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "18  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "19  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "20  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "21  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "22  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "23  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "24  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "25  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "26  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "27  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "28  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "29  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "30  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "31  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "32  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "33  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "34  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "35  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "36  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "37  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "38  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "39  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "40  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "41  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "42  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "43  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "44  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "45  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "46  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "47  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "48  https://kns.cnki.net/kcms/detail/detail.aspx?d...  \n",
       "49  https://kns.cnki.net/kcms/detail/detail.aspx?d...  "
      ]
     },
     "execution_count": 25,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "links=[]\n",
    "\n",
    "for link in href:\n",
    "    link=correct(link)\n",
    "    links.append(link)\n",
    "    df_links=pd.DataFrame({'详细页链接':links})\n",
    "    df_首页=pd.concat([pd.read_html(页面_表格_html)[0],df_links],axis=1)\n",
    "\n",
    "df_首页"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### PDF链接"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 26,
   "metadata": {},
   "outputs": [],
   "source": [
    "from requests_html import HTMLSession\n",
    "import urllib.parse"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 27,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['/kcms/download.aspx?filename=2I1bhVkZNRXVzFmZ4JzUWllYklzd1E3M0YHTMZjd3QTWsl1K4sCNRJ2Z5RXblN0LkhjTWFWUqpEdZNmRmF3M3w2bzgzV1RWZ2sWVDRlNo52YjV1LBBFSmFWcyhmcmlURHF2LGJVVoNkWz4kU3sSWXpESwc3YPJzb&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=6ticMRkZx9GWYBDapN0Ui90MoJmeLdzZ4pnRjBVWQZXZQxGRzVDSP1USvJ3TYJFSrRmUNxkSDN2ZCZUSWdDUHhVR480RjFkN5c1TKR2LzJ0dwB1V4cVbWlUaNRGOxQWePdjerEVWZlUQxMTTytkejl3Qp1kcC9Wc&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=6ticMRkZx9GWYBDapN0Ui90MoJmeLdzZ4pnRjBVWQZXZQxGRzVDSP1USvJ3TYJFSrRmUNxkSDN2ZCZUS5I2ZxZTb4QWUwNHdrIlb5kTao50dwJGdWZXbWlUaNRGOxQWePdjerEVWZlUQxMTTytkejl3Qp1kcC9Wc&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=KhEV4p2cFJGcu5UVYN2NRFjMr1WdVlUMJRzL5cmNaNFSONWbCdTaWFmMvk0Qmd1USN2bndWdEZkc3F2T6hVe5dGZU5GTwNmQ0oWZGRlauZnYxsSe1JXO4c1aUxmY4YWRslmTlxEWTNTWXt2a6RHVDJHZRt0RjZjV&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=FUG1UUa5Uaxt0cv8iU09SSzATNmdTRRBTdwsGa1gDRoV0bx9SbSRVWXxkQ2F0ZVFnS4JVblhVZSN0U=0TTyYnbmJmTBljQygTO08CSzNmSHtCblxWUP52UWl0ZzMUeFRTWnJURT5ET1AnW4IWO1lGdzhDRDF&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=FUG1UUa5Uaxt0cv8iU09SSzATNmdTRRBTdwsGa1gDRoV0bx9SbSRVWXxkQ2F0ZVFnS4JVblhVZSN0U=0zc3UnbmJmTBljQygTO08CSzNmSHtCblxWUP52UWl0ZzMUeFRTWnJURT5ET1AnW4IWO1lGdzhDRDF&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=XSuFVVJJ0L5EnWQdlaHRmRDR3RKNmSBtWM08kbG5mV5tGbWR2a2RXYpx2TwpmZzhFcnNkZGF3S01mV=0DNyEkSItUTWtWaRdld3l2NhVkQ0lmdttWWZ1UbDZ0dLJ3daVDb3siUyVVMXdVb2pWSsJkWJB1Zwl&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=wlXSuFVVJJ0L5EnWQdlaHRmRDR3RKNmSBtWM08kbG5mV5tGbWR2a2RXYpx2TwpmZzhFcnNkZGF3S01mVrt2LrwkW112a5l1SDp3ahhEUnxWY4U0NxkneyR3YTtEdiJzVxc3bpx2R2siUyVVMXdVb2pWSsJkWJB1Z&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=G92LjFESuFme2E1dBVlQLJzQQ1mTNVmNJh0YHhnNF9ET4YDU4AzUTtkMHJmWItSbHRXat5GWmlEcOhVWYpkaPFzRoZUeXZTbWpneE90Lq1WZBNzN4VWW3R2anRUS3NHSSlFd0QnavJ2R6Z1U2VDOhxWUnlmSPd1M&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=G92LjFESuFme2E1dBVlQLJzQQ1mTNVmNJh0YHhnNF9ET4YDU4AzUTtkMHJmWItSbHRXat5GWmlEcOhVWQBHWTtSau10NlhHNslkNNVTWxxWc1Q1RLRzY3R2anRUS3NHSSlFd0QnavJ2R6Z1U2VDOhxWUnlmSPd1M&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=UlmdVxmcqJUSNdFSZFWM2F3MvU0atdEb2QGMUFHO3p3ZrMzaNNWTE5mc04kUjpHODVXMMhFUHRVVopnYQFmbtljdo52TGdTNiRGO59kdtJETHd2TRVURCpHa20kdidXMVJ0Yyo3RlFEMRdUb0hEZrZ3RqhWWVVzb&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=UlmdVxmcqJUSNdFSZFWM2F3MvU0atdEb2QGMUFHO3p3ZrMzaNNWTE5mc04kUjpHODVXMMhFUHRVVopnYOZjV1IHNQVkeBJUQDB1ZnVnYKZVUsBzVRVURCpHa20kdidXMVJ0Yyo3RlFEMRdUb0hEZrZ3RqhWWVVzb&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=kbjJlNQ9keTlzZ3gjSLxGM6RHTCNUNQhGbiFmcI5mZl50MplWWKVzdvJkbMR3Mvc2YPlUSo1WSKtmZ=0DOkJ2SFJXOElneXhEa5kDZ3kVZmNkbBFFOqlHT2MjdBV3VkhmdhFTZ1pEeBdWcB5mQqR1cX1GVq9&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=kbjJlNQ9keTlzZ3gjSLxGM6RHTCNUNQhGbiFmcI5mZl50MplWWKVzdvJkbMR3Mvc2YPlUSo1WSKtmZ=0zb5tSZ2IXOElneXhEa5kDZ3kVZmNkbBFFOqlHT2MjdBV3VkhmdhFTZ1pEeBdWcB5mQqR1cX1GVq9&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=xUlYWF0TRVlYFJ2VMZVN2hEO5cVRuF3c1dTWoVGOlFDa0R1KGFFO2AHMOBFUyFFdLVWUKRnQCVkbkVVa4Y0R55mQoRjeoN3aYVGbKNTdY1GMTllMCp0aql2bGVDS1NGZ0kmQXZGVvomMsxmYH1kMZh1brcUbGljY&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=lYWF0TRVlYFJ2VMZVN2hEO5cVRuF3c1dTWoVGOlFDa0R1KGFFO2AHMOBFUyFFdLVWUKRnQCVkbkVVa=0zZNd0SLdXNlt0NKJjS3o1SYlVUn9SVrhlU2YnUqRWRaZzcNF3dvomMsxmYH1kMZh1brcUbGljYxU&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=RdFMDZXWzgnRhRFdT9GcTt0YhJTUw40b6JVSGlmQClzKFp0Trd1cyZFWvF1aE52b4gDbI1GdhB1UHdHbV1GOQFWZrUVWSF3K4NUW38ySNhmNqR0SjZGMqhVRuF0NvQ2SIJVWGF2LzxmbkVjWXZ0axtWWOJka5cVM&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=odnQ15Ub3YnU3NERtN0Z0AXYwcVd0QVR5EHU3lWNIJHdjJHO1RTaRBlcrMERixmQXt2cqdFZChWehhGc4QGOKZ2KoNmVMN3L5V2cYhlY5UUOBhjShplWaJnU5M2dxB1b0MGT2JTeVZGNrMTVyoEeiZFZkR1MXJWU&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=odnQ15Ub3YnU3NERtN0Z0AXYwcVd0QVR5EHU3lWNIJHdjJHO1RTaRBlcrMERixmQXt2cqdFZChWehhGcCNXRNd3QilzKoJjRrIWOUFFSTRnbvRlTsVmWaJnU5M2dxB1b0MGT2JTeVZGNrMTVyoEeiZFZkR1MXJWU&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=RdUaWJGUIJUaL5Ed3tUZ5wEejBjT24mM55GT5hEOHp3ZFJ3ZHdWTWt0MLlFc2BnV3EXMnh0VjJEbDJ1cx9SY2h0T0NEW1sEN1RzR44WdL1EWoVVNnVTUXZWVNJlVYFlMKVXc4pkYXpXbRlUdwIDU5lkNatSdUNzL&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=UJmYuZTbU9SMDRHSBpUNl5WQ510Y0MFZRRlbz92N2hmNuxWcZhVVXJHWKF2LNVzS4RmboN3TDtUUXVndvEXYm9SVuZVQplHRMxkWINHRLxUc3FVUUt2cw5mMhZlN3UzSMhFetVXR3VmVFJGO3YXRrVnSUFVS48ke&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=mYuZTbU9SMDRHSBpUNl5WQ510Y0MFZRRlbz92N2hmNuxWcZhVVXJHWKF2LNVzS4RmboN3TDtUUXVnd=0zbhJlQ0NDRZB3ZrQTVnZXSD9GMJdFNFdkMJhWazhjezVGVuh3T6VmVFJGO3YXRrVnSUFVS48keUJ&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=y8mSnllavREOOhVOYhlMvFEU2J1UHlEcSJzYkBTSyJWZJZUaEdWeMx0LYdHVn9UOvclMKNGSkR2d5VWeQZnR1V1VEdWNp1ETOdlcslETolUUh1WbllzaoNTexFza69mbOR3NINUR4JTMsZzSSFHe4N2Z61mUxoFV&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=y8mSnllavREOOhVOYhlMvFEU2J1UHlEcSJzYkBTSyJWZJZUaEdWeMx0LYdHVn9UOvclMKNGSkR2d5VWenR0SzEWSDNTQ4dUbyt0NTVDT3p3U5olRxF2aoNTexFza69mbOR3NINUR4JTMsZzSSFHe4N2Z61mUxoFV&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=mSnllavREOOhVOYhlMvFEU2J1UHlEcSJzYkBTSyJWZJZUaEdWeMx0LYdHVn9UOvclMKNGSkR2d5VWe=0zYYRlTiREeUpETDBXWadGasNVcoJzUBBTNDZ0RKp1TKBldHVHU5JTMsZzSSFHe4N2Z61mUxoFVy8&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=WVsZUQFJHMKdVV3YHdu1kRHRHRrV2UrAXdIV3VqpUUDhURal3b5c1Shl1Yzk3QrBnRi5keFdnYU90Q=0TQrETO5NHZzZDVkVDWPFUOuZzKhpmVJlnQxVDaYVTV5NDUyUWVMJXcro1MTp2cDZ2N2x0Zk52ZSt&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=VNjR1KwkHWC92Skl2aCJ1RLd3KqhVWBVkTSRVMWJEdIhldC1US2tiM5BVZaNVM6ZUSil3cmd0T2JnR=0zZ1dETh9UVmVDWkdWUBRXUzATQHVWRW5GR2Y1bGlGZuV3aLVVdGJjY6VkQLRUMI9mMMFnWQh2TJl&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=JlVNjR1KwkHWC92Skl2aCJ1RLd3KqhVWBVkTSRVMWJEdIhldC1US2tiM5BVZaNVM6ZUSil3cmd0T2JnRUR2UBx2dlBTVMVjWzdVWDhUYx5EbxkFUxEzQ0FXeDhjMtNkWv4meJd1TGJjY6VkQLRUMI9mMMFnWQh2T&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=lZzLB10NCplUaRFbsN0UOx0MzVnMmdmew82bxRlY2Ulc1hUN3BlYiJHaxZUNvhUYzZjR0o2a4pFdQJWS6dmdshWQ3plMjlUTapVTHZVOwllbphkajFDVHVFaJl1LQtUdqZDbwR2SIh0c5YGZPlDZnJHaXhGUKp3V&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=3tiZMhDayIXZzADbYpneIxkZoNnd6Z1ayRVNpVUeM10T4AzN08kSwskMuZESYNmMxFkboR1YZJnWq1ETsdGc4k1KxokZEJ1VXNjWadEci5Gdq9yZTFTchd3RtlEZFNTZNZjWWJlMkNzal9CMSdzQykVZ5FUTipUc&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=vEmZHVjQ2IXd4sWR3cnd1EDU5tSZod1bK1UYpF1QBJletF3K6VUaw80awQFMItUatNFRuVkV6NURM9GUC9iet5EcN12TuZ0LyAzNBlmTzgkaHZ3Yk9ySpNkcQJnSzlWdJ1WdwhWbs5meYhVRnlGMrpkWJZnayMFb&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=vEmZHVjQ2IXd4sWR3cnd1EDU5tSZod1bK1UYpF1QBJletF3K6VUaw80awQFMItUatNFRuVkV6NURM9GU1V1QiN0RUlmNL9yLplVU3MjeBh3auZXM5V3SpNkcQJnSzlWdJ1WdwhWbs5meYhVRnlGMrpkWJZnayMFb&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=WW1FmR48SZJtycF9CNwAFWVlnNwNWWZlFMhZjSOVDe4gUVw9yN69UNUBlaUJGO4UlTkBnThVlcml1U=0TQYNmV65ERFhTQBl1cix2KBFGaoN0TrRVYzoEeXtkTm1mZ5pkVK9COZF0bJFUevczctZzdlNmays&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=sp1d3ATMI1kV3cnQZl2Y5UWMxlzQMVlcvZ3TGRmWtNUVEl3KatyTkpFdtJTS0UnUMZTQllWeC5GWJpkVHR0UEBlNLlzVuN0MzZmShdHM04Gb5kXSMdkZVNzcwxWYxImUBVTdwM1RzNXMvI0N4IWV1QUdmlzQ6JHc&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=1d3ATMI1kV3cnQZl2Y5UWMxlzQMVlcvZ3TGRmWtNUVEl3KatyTkpFdtJTS0UnUMZTQllWeC5GWJpkV=0zdxJEbJV0R5hmaGl1ZwAjNC52N5sUVwh3TGdkcINnV21Eb0YGb0NXMvI0N4IWV1QUdmlzQ6JHcsp&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=mT6pHa0kXV1QmaWZjbyY0Vjd3YTpXcy9UMaRTNLVUaOtCS5hEV2d0VhtkSMdGUQJ2MwMVcil3QjxWW=0TWBJHUhlGTKBzVMpVOPtEaxAlRQNjMxoEWyJmT6FkbkVTNWlkNpRUUopGe3JFcvM0RahlRHhmbpl&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=mT6pHa0kXV1QmaWZjbyY0Vjd3YTpXcy9UMaRTNLVUaOtCS5hEV2d0VhtkSMdGUQJ2MwMVcil3QjxWW=0za14WduBVROFkU0cjNURmWCB1R002dwh3UyJmT6FkbkVTNWlkNpRUUopGe3JFcvM0RahlRHhmbpl&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=0ZqVWbRtWTMdHdr9CdEJ3Sad0cu10KUpWe0ZjQiFERSp0d0AFT352Uxg3M3pVa5onQWRkaDFFcFd1Y=0DOLJnUHVlWsJHaPRXS4sEUwUDZXt2LBl0TlB1NFhUYthlZWhETv1UYzpVaDFWTk5mTqd1Krd1Rxs&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=0ZqVWbRtWTMdHdr9CdEJ3Sad0cu10KUpWe0ZjQiFERSp0d0AFT352Uxg3M3pVa5onQWRkaDFFcFd1Y=0zaIZnUHVlWsJHaPRXS4sEUwUDZXt2LBl0TlB1NFhUYthlZWhETv1UYzpVaDFWTk5mTqd1Krd1Rxs&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=zVDhFN5VjWrRDdNRVYrEkQ0wGaMR3YSNWQwIje2tETqV3Z6l0ZBhmU5sWVWpUTMZkT19mYkpmVZdkZ=0zZnNkWnRGZLZleHFValpWa1smeXdTRxQ2Yk12SydFRQZmY2plVxFHd5UTQk9mNrolZRBVT6NjY4F&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=zVDhFN5VjWrRDdNRVYrEkQ0wGaMR3YSNWQwIje2tETqV3Z6l0ZBhmU5sWVWpUTMZkT19mYkpmVZdkZ=0zaJdmTupFbv8WQVplWPh3KlVTbCF1TPhVYk12SydFRQZmY2plVxFHd5UTQk9mNrolZRBVT6NjY4F&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=zVDhFN5VjWrRDdNRVYrEkQ0wGaMR3YSNWQwIje2tETqV3Z6l0ZBhmU5sWVWpUTMZkT19mYkpmVZdkZ=0DNCF1c1M1N6tkQ4J1Rl9EcvwWQvNGenFWYk12SydFRQZmY2plVxFHd5UTQk9mNrolZRBVT6NjY4F&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=mctVnR5cGaSNmWEpmWrknT4RHMsRnNNNEOEdnV1Q0arRWb5VVO0MzYh1UQTVXbCh0cTlVVEJkQClWa=0zYj1WOzQEMQh2TtpUZxQ1V1AHdMhXeqtiZDh3RqVlQykXRXp1SxYzYkR2aMJkSz92MttyUWJGZCh&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=mctVnR5cGaSNmWEpmWrknT4RHMsRnNNNEOEdnV1Q0arRWb5VVO0MzYh1UQTVXbCh0cTlVVEJkQClWa=0TUKlVchVnT5sSVS90SihXZ34kVsB3KBl3ZEh3RqVlQykXRXp1SxYzYkR2aMJkSz92MttyUWJGZCh&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=xMVRXpkZWVGMRhHe5pXdVFjSzZGMSZnczsidnBnctZUNJ1EMWJTdYhkWiRFSTRldV9UbzpUTX1kZVRVbVNFOmNWe15GWKVmS4wGUXhWYqhjc2gHZZRTN5E0KTREZWhHUshGRIJURHtkd4dWUBpndCNmWr8UVa5Ga&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=xMVRXpkZWVGMRhHe5pXdVFjSzZGMSZnczsidnBnctZUNJ1EMWJTdYhkWiRFSTRldV9UbzpUTX1kZVRVb2BjSCpEM2UlM4d0QOJWbCtUVIRnelN3U4dGN5E0KTREZWhHUshGRIJURHtkd4dWUBpndCNmWr8UVa5Ga&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=VRXpkZWVGMRhHe5pXdVFjSzZGMSZnczsidnBnctZUNJ1EMWJTdYhkWiRFSTRldV9UbzpUTX1kZVRVb=0zcrg2UxQXQ4IWQ2Mma280axkWUYR2ZDFVd4AXb15kR0o1VqZlbHtkd4dWUBpndCNmWr8UVa5GaxM&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=2tEUvdWMyQ3bTVFcShjaMhjboxWY4RUYIp1d1Enb4d1aXh0dVpXWnVDWxYFTvJkcCtkbVVXR4ZGV4REctZ1T3plWSpWM3EVNBl3dOpHaMlUUvh3azI3Sh5WUlVzQGVEM2Vla250ZldFSnN0Rn1GMr40R252L4Ezb&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=1kGVDRXO0sSdihEOzZzdrR2YqR2NBdlUxhGTaRTS6JUN4dWcxMHSMNDerdHW0FneORmcBZGeYhXeSd2ciVDO08kcuN3aYtUUjhnbMRFNRJWeYZGN3t2RYZkdrZkZMpWQTd2ZjNVaQhjSupWQSZUbnFzLRVHMTd1K&tablename=CAPJLAST&dflag=pdfdown',\n",
       " '/kcms/download.aspx?filename=1kGVDRXO0sSdihEOzZzdrR2YqR2NBdlUxhGTaRTS6JUN4dWcxMHSMNDerdHW0FneORmcBZGeYhXeSd2ckJ1YFNHaJh2Kj12djRmU2dmWTdDajRkQKF0RYZkdrZkZMpWQTd2ZjNVaQhjSupWQSZUbnFzLRVHMTd1K&tablename=CAPJLAST&dflag=pdfdown']"
      ]
     },
     "execution_count": 27,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "session = HTMLSession()\n",
    "\n",
    "pdf_links=[]\n",
    "\n",
    "for url in links:\n",
    "    r = session.get(url)\n",
    "    pdf_link_xpath=r.html.xpath('//*[@id=\"pdfDown\"]/@href')[1]\n",
    "    pdf_links.append(pdf_link_xpath)\n",
    "pdf_links"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 28,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['https://kns.cnki.net/kcms/download.aspx?filename=2I1bhVkZNRXVzFmZ4JzUWllYklzd1E3M0YHTMZjd3QTWsl1K4sCNRJ2Z5RXblN0LkhjTWFWUqpEdZNmRmF3M3w2bzgzV1RWZ2sWVDRlNo52YjV1LBBFSmFWcyhmcmlURHF2LGJVVoNkWz4kU3sSWXpESwc3YPJzb&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=6ticMRkZx9GWYBDapN0Ui90MoJmeLdzZ4pnRjBVWQZXZQxGRzVDSP1USvJ3TYJFSrRmUNxkSDN2ZCZUSWdDUHhVR480RjFkN5c1TKR2LzJ0dwB1V4cVbWlUaNRGOxQWePdjerEVWZlUQxMTTytkejl3Qp1kcC9Wc&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=6ticMRkZx9GWYBDapN0Ui90MoJmeLdzZ4pnRjBVWQZXZQxGRzVDSP1USvJ3TYJFSrRmUNxkSDN2ZCZUS5I2ZxZTb4QWUwNHdrIlb5kTao50dwJGdWZXbWlUaNRGOxQWePdjerEVWZlUQxMTTytkejl3Qp1kcC9Wc&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=KhEV4p2cFJGcu5UVYN2NRFjMr1WdVlUMJRzL5cmNaNFSONWbCdTaWFmMvk0Qmd1USN2bndWdEZkc3F2T6hVe5dGZU5GTwNmQ0oWZGRlauZnYxsSe1JXO4c1aUxmY4YWRslmTlxEWTNTWXt2a6RHVDJHZRt0RjZjV&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=FUG1UUa5Uaxt0cv8iU09SSzATNmdTRRBTdwsGa1gDRoV0bx9SbSRVWXxkQ2F0ZVFnS4JVblhVZSN0U=0TTyYnbmJmTBljQygTO08CSzNmSHtCblxWUP52UWl0ZzMUeFRTWnJURT5ET1AnW4IWO1lGdzhDRDF&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=FUG1UUa5Uaxt0cv8iU09SSzATNmdTRRBTdwsGa1gDRoV0bx9SbSRVWXxkQ2F0ZVFnS4JVblhVZSN0U=0zc3UnbmJmTBljQygTO08CSzNmSHtCblxWUP52UWl0ZzMUeFRTWnJURT5ET1AnW4IWO1lGdzhDRDF&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=XSuFVVJJ0L5EnWQdlaHRmRDR3RKNmSBtWM08kbG5mV5tGbWR2a2RXYpx2TwpmZzhFcnNkZGF3S01mV=0DNyEkSItUTWtWaRdld3l2NhVkQ0lmdttWWZ1UbDZ0dLJ3daVDb3siUyVVMXdVb2pWSsJkWJB1Zwl&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=wlXSuFVVJJ0L5EnWQdlaHRmRDR3RKNmSBtWM08kbG5mV5tGbWR2a2RXYpx2TwpmZzhFcnNkZGF3S01mVrt2LrwkW112a5l1SDp3ahhEUnxWY4U0NxkneyR3YTtEdiJzVxc3bpx2R2siUyVVMXdVb2pWSsJkWJB1Z&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=G92LjFESuFme2E1dBVlQLJzQQ1mTNVmNJh0YHhnNF9ET4YDU4AzUTtkMHJmWItSbHRXat5GWmlEcOhVWYpkaPFzRoZUeXZTbWpneE90Lq1WZBNzN4VWW3R2anRUS3NHSSlFd0QnavJ2R6Z1U2VDOhxWUnlmSPd1M&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=G92LjFESuFme2E1dBVlQLJzQQ1mTNVmNJh0YHhnNF9ET4YDU4AzUTtkMHJmWItSbHRXat5GWmlEcOhVWQBHWTtSau10NlhHNslkNNVTWxxWc1Q1RLRzY3R2anRUS3NHSSlFd0QnavJ2R6Z1U2VDOhxWUnlmSPd1M&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=UlmdVxmcqJUSNdFSZFWM2F3MvU0atdEb2QGMUFHO3p3ZrMzaNNWTE5mc04kUjpHODVXMMhFUHRVVopnYQFmbtljdo52TGdTNiRGO59kdtJETHd2TRVURCpHa20kdidXMVJ0Yyo3RlFEMRdUb0hEZrZ3RqhWWVVzb&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=UlmdVxmcqJUSNdFSZFWM2F3MvU0atdEb2QGMUFHO3p3ZrMzaNNWTE5mc04kUjpHODVXMMhFUHRVVopnYOZjV1IHNQVkeBJUQDB1ZnVnYKZVUsBzVRVURCpHa20kdidXMVJ0Yyo3RlFEMRdUb0hEZrZ3RqhWWVVzb&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=kbjJlNQ9keTlzZ3gjSLxGM6RHTCNUNQhGbiFmcI5mZl50MplWWKVzdvJkbMR3Mvc2YPlUSo1WSKtmZ=0DOkJ2SFJXOElneXhEa5kDZ3kVZmNkbBFFOqlHT2MjdBV3VkhmdhFTZ1pEeBdWcB5mQqR1cX1GVq9&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=kbjJlNQ9keTlzZ3gjSLxGM6RHTCNUNQhGbiFmcI5mZl50MplWWKVzdvJkbMR3Mvc2YPlUSo1WSKtmZ=0zb5tSZ2IXOElneXhEa5kDZ3kVZmNkbBFFOqlHT2MjdBV3VkhmdhFTZ1pEeBdWcB5mQqR1cX1GVq9&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=xUlYWF0TRVlYFJ2VMZVN2hEO5cVRuF3c1dTWoVGOlFDa0R1KGFFO2AHMOBFUyFFdLVWUKRnQCVkbkVVa4Y0R55mQoRjeoN3aYVGbKNTdY1GMTllMCp0aql2bGVDS1NGZ0kmQXZGVvomMsxmYH1kMZh1brcUbGljY&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=lYWF0TRVlYFJ2VMZVN2hEO5cVRuF3c1dTWoVGOlFDa0R1KGFFO2AHMOBFUyFFdLVWUKRnQCVkbkVVa=0zZNd0SLdXNlt0NKJjS3o1SYlVUn9SVrhlU2YnUqRWRaZzcNF3dvomMsxmYH1kMZh1brcUbGljYxU&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=RdFMDZXWzgnRhRFdT9GcTt0YhJTUw40b6JVSGlmQClzKFp0Trd1cyZFWvF1aE52b4gDbI1GdhB1UHdHbV1GOQFWZrUVWSF3K4NUW38ySNhmNqR0SjZGMqhVRuF0NvQ2SIJVWGF2LzxmbkVjWXZ0axtWWOJka5cVM&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=odnQ15Ub3YnU3NERtN0Z0AXYwcVd0QVR5EHU3lWNIJHdjJHO1RTaRBlcrMERixmQXt2cqdFZChWehhGc4QGOKZ2KoNmVMN3L5V2cYhlY5UUOBhjShplWaJnU5M2dxB1b0MGT2JTeVZGNrMTVyoEeiZFZkR1MXJWU&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=odnQ15Ub3YnU3NERtN0Z0AXYwcVd0QVR5EHU3lWNIJHdjJHO1RTaRBlcrMERixmQXt2cqdFZChWehhGcCNXRNd3QilzKoJjRrIWOUFFSTRnbvRlTsVmWaJnU5M2dxB1b0MGT2JTeVZGNrMTVyoEeiZFZkR1MXJWU&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=RdUaWJGUIJUaL5Ed3tUZ5wEejBjT24mM55GT5hEOHp3ZFJ3ZHdWTWt0MLlFc2BnV3EXMnh0VjJEbDJ1cx9SY2h0T0NEW1sEN1RzR44WdL1EWoVVNnVTUXZWVNJlVYFlMKVXc4pkYXpXbRlUdwIDU5lkNatSdUNzL&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=UJmYuZTbU9SMDRHSBpUNl5WQ510Y0MFZRRlbz92N2hmNuxWcZhVVXJHWKF2LNVzS4RmboN3TDtUUXVndvEXYm9SVuZVQplHRMxkWINHRLxUc3FVUUt2cw5mMhZlN3UzSMhFetVXR3VmVFJGO3YXRrVnSUFVS48ke&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=mYuZTbU9SMDRHSBpUNl5WQ510Y0MFZRRlbz92N2hmNuxWcZhVVXJHWKF2LNVzS4RmboN3TDtUUXVnd=0zbhJlQ0NDRZB3ZrQTVnZXSD9GMJdFNFdkMJhWazhjezVGVuh3T6VmVFJGO3YXRrVnSUFVS48keUJ&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=y8mSnllavREOOhVOYhlMvFEU2J1UHlEcSJzYkBTSyJWZJZUaEdWeMx0LYdHVn9UOvclMKNGSkR2d5VWeQZnR1V1VEdWNp1ETOdlcslETolUUh1WbllzaoNTexFza69mbOR3NINUR4JTMsZzSSFHe4N2Z61mUxoFV&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=y8mSnllavREOOhVOYhlMvFEU2J1UHlEcSJzYkBTSyJWZJZUaEdWeMx0LYdHVn9UOvclMKNGSkR2d5VWenR0SzEWSDNTQ4dUbyt0NTVDT3p3U5olRxF2aoNTexFza69mbOR3NINUR4JTMsZzSSFHe4N2Z61mUxoFV&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=mSnllavREOOhVOYhlMvFEU2J1UHlEcSJzYkBTSyJWZJZUaEdWeMx0LYdHVn9UOvclMKNGSkR2d5VWe=0zYYRlTiREeUpETDBXWadGasNVcoJzUBBTNDZ0RKp1TKBldHVHU5JTMsZzSSFHe4N2Z61mUxoFVy8&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=WVsZUQFJHMKdVV3YHdu1kRHRHRrV2UrAXdIV3VqpUUDhURal3b5c1Shl1Yzk3QrBnRi5keFdnYU90Q=0TQrETO5NHZzZDVkVDWPFUOuZzKhpmVJlnQxVDaYVTV5NDUyUWVMJXcro1MTp2cDZ2N2x0Zk52ZSt&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=VNjR1KwkHWC92Skl2aCJ1RLd3KqhVWBVkTSRVMWJEdIhldC1US2tiM5BVZaNVM6ZUSil3cmd0T2JnR=0zZ1dETh9UVmVDWkdWUBRXUzATQHVWRW5GR2Y1bGlGZuV3aLVVdGJjY6VkQLRUMI9mMMFnWQh2TJl&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=JlVNjR1KwkHWC92Skl2aCJ1RLd3KqhVWBVkTSRVMWJEdIhldC1US2tiM5BVZaNVM6ZUSil3cmd0T2JnRUR2UBx2dlBTVMVjWzdVWDhUYx5EbxkFUxEzQ0FXeDhjMtNkWv4meJd1TGJjY6VkQLRUMI9mMMFnWQh2T&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=lZzLB10NCplUaRFbsN0UOx0MzVnMmdmew82bxRlY2Ulc1hUN3BlYiJHaxZUNvhUYzZjR0o2a4pFdQJWS6dmdshWQ3plMjlUTapVTHZVOwllbphkajFDVHVFaJl1LQtUdqZDbwR2SIh0c5YGZPlDZnJHaXhGUKp3V&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=3tiZMhDayIXZzADbYpneIxkZoNnd6Z1ayRVNpVUeM10T4AzN08kSwskMuZESYNmMxFkboR1YZJnWq1ETsdGc4k1KxokZEJ1VXNjWadEci5Gdq9yZTFTchd3RtlEZFNTZNZjWWJlMkNzal9CMSdzQykVZ5FUTipUc&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=vEmZHVjQ2IXd4sWR3cnd1EDU5tSZod1bK1UYpF1QBJletF3K6VUaw80awQFMItUatNFRuVkV6NURM9GUC9iet5EcN12TuZ0LyAzNBlmTzgkaHZ3Yk9ySpNkcQJnSzlWdJ1WdwhWbs5meYhVRnlGMrpkWJZnayMFb&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=vEmZHVjQ2IXd4sWR3cnd1EDU5tSZod1bK1UYpF1QBJletF3K6VUaw80awQFMItUatNFRuVkV6NURM9GU1V1QiN0RUlmNL9yLplVU3MjeBh3auZXM5V3SpNkcQJnSzlWdJ1WdwhWbs5meYhVRnlGMrpkWJZnayMFb&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=WW1FmR48SZJtycF9CNwAFWVlnNwNWWZlFMhZjSOVDe4gUVw9yN69UNUBlaUJGO4UlTkBnThVlcml1U=0TQYNmV65ERFhTQBl1cix2KBFGaoN0TrRVYzoEeXtkTm1mZ5pkVK9COZF0bJFUevczctZzdlNmays&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=sp1d3ATMI1kV3cnQZl2Y5UWMxlzQMVlcvZ3TGRmWtNUVEl3KatyTkpFdtJTS0UnUMZTQllWeC5GWJpkVHR0UEBlNLlzVuN0MzZmShdHM04Gb5kXSMdkZVNzcwxWYxImUBVTdwM1RzNXMvI0N4IWV1QUdmlzQ6JHc&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=1d3ATMI1kV3cnQZl2Y5UWMxlzQMVlcvZ3TGRmWtNUVEl3KatyTkpFdtJTS0UnUMZTQllWeC5GWJpkV=0zdxJEbJV0R5hmaGl1ZwAjNC52N5sUVwh3TGdkcINnV21Eb0YGb0NXMvI0N4IWV1QUdmlzQ6JHcsp&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=mT6pHa0kXV1QmaWZjbyY0Vjd3YTpXcy9UMaRTNLVUaOtCS5hEV2d0VhtkSMdGUQJ2MwMVcil3QjxWW=0TWBJHUhlGTKBzVMpVOPtEaxAlRQNjMxoEWyJmT6FkbkVTNWlkNpRUUopGe3JFcvM0RahlRHhmbpl&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=mT6pHa0kXV1QmaWZjbyY0Vjd3YTpXcy9UMaRTNLVUaOtCS5hEV2d0VhtkSMdGUQJ2MwMVcil3QjxWW=0za14WduBVROFkU0cjNURmWCB1R002dwh3UyJmT6FkbkVTNWlkNpRUUopGe3JFcvM0RahlRHhmbpl&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=0ZqVWbRtWTMdHdr9CdEJ3Sad0cu10KUpWe0ZjQiFERSp0d0AFT352Uxg3M3pVa5onQWRkaDFFcFd1Y=0DOLJnUHVlWsJHaPRXS4sEUwUDZXt2LBl0TlB1NFhUYthlZWhETv1UYzpVaDFWTk5mTqd1Krd1Rxs&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=0ZqVWbRtWTMdHdr9CdEJ3Sad0cu10KUpWe0ZjQiFERSp0d0AFT352Uxg3M3pVa5onQWRkaDFFcFd1Y=0zaIZnUHVlWsJHaPRXS4sEUwUDZXt2LBl0TlB1NFhUYthlZWhETv1UYzpVaDFWTk5mTqd1Krd1Rxs&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=zVDhFN5VjWrRDdNRVYrEkQ0wGaMR3YSNWQwIje2tETqV3Z6l0ZBhmU5sWVWpUTMZkT19mYkpmVZdkZ=0zZnNkWnRGZLZleHFValpWa1smeXdTRxQ2Yk12SydFRQZmY2plVxFHd5UTQk9mNrolZRBVT6NjY4F&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=zVDhFN5VjWrRDdNRVYrEkQ0wGaMR3YSNWQwIje2tETqV3Z6l0ZBhmU5sWVWpUTMZkT19mYkpmVZdkZ=0zaJdmTupFbv8WQVplWPh3KlVTbCF1TPhVYk12SydFRQZmY2plVxFHd5UTQk9mNrolZRBVT6NjY4F&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=zVDhFN5VjWrRDdNRVYrEkQ0wGaMR3YSNWQwIje2tETqV3Z6l0ZBhmU5sWVWpUTMZkT19mYkpmVZdkZ=0DNCF1c1M1N6tkQ4J1Rl9EcvwWQvNGenFWYk12SydFRQZmY2plVxFHd5UTQk9mNrolZRBVT6NjY4F&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=mctVnR5cGaSNmWEpmWrknT4RHMsRnNNNEOEdnV1Q0arRWb5VVO0MzYh1UQTVXbCh0cTlVVEJkQClWa=0zYj1WOzQEMQh2TtpUZxQ1V1AHdMhXeqtiZDh3RqVlQykXRXp1SxYzYkR2aMJkSz92MttyUWJGZCh&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=mctVnR5cGaSNmWEpmWrknT4RHMsRnNNNEOEdnV1Q0arRWb5VVO0MzYh1UQTVXbCh0cTlVVEJkQClWa=0TUKlVchVnT5sSVS90SihXZ34kVsB3KBl3ZEh3RqVlQykXRXp1SxYzYkR2aMJkSz92MttyUWJGZCh&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=xMVRXpkZWVGMRhHe5pXdVFjSzZGMSZnczsidnBnctZUNJ1EMWJTdYhkWiRFSTRldV9UbzpUTX1kZVRVbVNFOmNWe15GWKVmS4wGUXhWYqhjc2gHZZRTN5E0KTREZWhHUshGRIJURHtkd4dWUBpndCNmWr8UVa5Ga&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=xMVRXpkZWVGMRhHe5pXdVFjSzZGMSZnczsidnBnctZUNJ1EMWJTdYhkWiRFSTRldV9UbzpUTX1kZVRVb2BjSCpEM2UlM4d0QOJWbCtUVIRnelN3U4dGN5E0KTREZWhHUshGRIJURHtkd4dWUBpndCNmWr8UVa5Ga&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=VRXpkZWVGMRhHe5pXdVFjSzZGMSZnczsidnBnctZUNJ1EMWJTdYhkWiRFSTRldV9UbzpUTX1kZVRVb=0zcrg2UxQXQ4IWQ2Mma280axkWUYR2ZDFVd4AXb15kR0o1VqZlbHtkd4dWUBpndCNmWr8UVa5GaxM&tablename=CJFDAUTO&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=2tEUvdWMyQ3bTVFcShjaMhjboxWY4RUYIp1d1Enb4d1aXh0dVpXWnVDWxYFTvJkcCtkbVVXR4ZGV4REctZ1T3plWSpWM3EVNBl3dOpHaMlUUvh3azI3Sh5WUlVzQGVEM2Vla250ZldFSnN0Rn1GMr40R252L4Ezb&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=1kGVDRXO0sSdihEOzZzdrR2YqR2NBdlUxhGTaRTS6JUN4dWcxMHSMNDerdHW0FneORmcBZGeYhXeSd2ciVDO08kcuN3aYtUUjhnbMRFNRJWeYZGN3t2RYZkdrZkZMpWQTd2ZjNVaQhjSupWQSZUbnFzLRVHMTd1K&tablename=CAPJLAST&dflag=pdfdown',\n",
       " 'https://kns.cnki.net/kcms/download.aspx?filename=1kGVDRXO0sSdihEOzZzdrR2YqR2NBdlUxhGTaRTS6JUN4dWcxMHSMNDerdHW0FneORmcBZGeYhXeSd2ckJ1YFNHaJh2Kj12djRmU2dmWTdDajRkQKF0RYZkdrZkZMpWQTd2ZjNVaQhjSupWQSZUbnFzLRVHMTd1K&tablename=CAPJLAST&dflag=pdfdown']"
      ]
     },
     "execution_count": 28,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 完整链接\n",
    "pdf_href=['https://kns.cnki.net'+link for link in pdf_links]\n",
    "pdf_href"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 24,
   "metadata": {},
   "outputs": [],
   "source": [
    "nextpage = driver.find_element_by_id('PageNext')\n",
    "all = driver.find_element_by_xpath('//*[@id=\"selectCheckAll1\"]')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "      <th>详细页链接</th>\n",
       "      <th>PDF下载链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>1</td>\n",
       "      <td>机器学习在档案管理中的应用与挑战——基于新南威尔士州档案馆机器学习实验的调查与启示  网络首发</td>\n",
       "      <td>代林序; 张玉洁</td>\n",
       "      <td>档案与建设</td>\n",
       "      <td>2021-07-02 16:16</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>2</td>\n",
       "      <td>关于智能化战争的基本认知  网络首发</td>\n",
       "      <td>郭明</td>\n",
       "      <td>人民论坛·学术前沿</td>\n",
       "      <td>2021-07-02 15:49</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>3</td>\n",
       "      <td>金融科技中人工智能技术典型事实与核心规律  网络首发</td>\n",
       "      <td>陈增敬; 严晓东; 冯新伟</td>\n",
       "      <td>中国科学基金</td>\n",
       "      <td>2021-07-02 11:39</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>4</td>\n",
       "      <td>卫星在轨故障案例与人工智能故障诊断  网络首发</td>\n",
       "      <td>王亚坤;杨凯飞;张婕;郭莉芳;韩笑冬</td>\n",
       "      <td>中国空间科学技术</td>\n",
       "      <td>2021-07-02 08:49</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>5</td>\n",
       "      <td>高等职业教育智能生态系统:内涵、结构与实践路径</td>\n",
       "      <td>徐晔</td>\n",
       "      <td>中国远程教育</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>6</td>\n",
       "      <td>近20年在线学习环境研究评述——基于LDA和DTM的动态分析</td>\n",
       "      <td>牛晓杰; 郑勤华</td>\n",
       "      <td>中国远程教育</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>7</td>\n",
       "      <td>教育人工智能场域下教师角色与行动取向</td>\n",
       "      <td>赵磊磊; 马玉菲; 代蕊华</td>\n",
       "      <td>中国远程教育</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>8</td>\n",
       "      <td>智能财务人才培养与浙江大学的探索  网络首发</td>\n",
       "      <td>陈俊; 董望</td>\n",
       "      <td>财会月刊</td>\n",
       "      <td>2021-07-01 15:42</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>9</td>\n",
       "      <td>机器学习在智能配用电领域的应用：北美工程实践概述  网络首发</td>\n",
       "      <td>李亦言; 胡荣兴; 宋立冬; 贾乾罡; 陆宁</td>\n",
       "      <td>电力系统自动化</td>\n",
       "      <td>2021-07-01 09:50</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>10</td>\n",
       "      <td>国际经贸协定中的源代码规则新发展及中国立场  网络首发</td>\n",
       "      <td>鄢雨虹</td>\n",
       "      <td>武大国际法评论</td>\n",
       "      <td>2021-07-01 09:16</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>11</td>\n",
       "      <td>人工智能赋能高校数据治理：逻辑、挑战与实践  网络首发</td>\n",
       "      <td>赵磊磊</td>\n",
       "      <td>重庆高教研究</td>\n",
       "      <td>2021-06-30 14:14</td>\n",
       "      <td>NaN</td>\n",
       "      <td>114.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>12</td>\n",
       "      <td>嵌入式神经网络加速器及SoC芯片  网络首发</td>\n",
       "      <td>易冬柏; 陈恒; 何乐年</td>\n",
       "      <td>仪器仪表学报</td>\n",
       "      <td>2021-06-30 10:09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>59.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>13</td>\n",
       "      <td>绿色理念下智慧零售创新发展路径</td>\n",
       "      <td>翟璇</td>\n",
       "      <td>商业经济研究</td>\n",
       "      <td>2021-06-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>6.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>14</td>\n",
       "      <td>数字经济视野下跨境电商企业的升级策略研究——评《跨境电商与国际物流》</td>\n",
       "      <td>单浩耘</td>\n",
       "      <td>商业经济研究</td>\n",
       "      <td>2021-06-30</td>\n",
       "      <td>NaN</td>\n",
       "      <td>15.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>15</td>\n",
       "      <td>智能化金融监管：模型框架、边缘约束和实践策略  网络首发</td>\n",
       "      <td>乔宇锋</td>\n",
       "      <td>南方金融</td>\n",
       "      <td>2021-06-29 17:04</td>\n",
       "      <td>NaN</td>\n",
       "      <td>105.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>16</td>\n",
       "      <td>“智能+”时代的现代文化产业体系：挑战与重塑</td>\n",
       "      <td>解学芳; 雷文宣</td>\n",
       "      <td>深圳大学学报(人文社会科学版)</td>\n",
       "      <td>2021-06-29 15:45</td>\n",
       "      <td>NaN</td>\n",
       "      <td>65.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>17</td>\n",
       "      <td>人工智能在胸部创伤肋骨骨折CT诊断中应用的初步研究  网络首发</td>\n",
       "      <td>刘想;谢辉辉;许玉峰;陶晓峰;柳林</td>\n",
       "      <td>上海交通大学学报(医学版)</td>\n",
       "      <td>2021-06-29 14:47</td>\n",
       "      <td>NaN</td>\n",
       "      <td>38.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>17</th>\n",
       "      <td>18</td>\n",
       "      <td>人工智能技术在火电行业的应用探讨  网络首发</td>\n",
       "      <td>华志刚; 范佳卿; 郭荣; 汪勇; 吴潇翔</td>\n",
       "      <td>中国电力</td>\n",
       "      <td>2021-06-29 11:10</td>\n",
       "      <td>NaN</td>\n",
       "      <td>127.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>18</th>\n",
       "      <td>19</td>\n",
       "      <td>基于切换输出机制的超短期风电功率预测  网络首发</td>\n",
       "      <td>杨茂; 许传宇; 王凯旋</td>\n",
       "      <td>高电压技术</td>\n",
       "      <td>2021-06-29 11:02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>23.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>19</th>\n",
       "      <td>20</td>\n",
       "      <td>DCN:双通道密集哈达玛卷积的画质评价网络  网络首发</td>\n",
       "      <td>杨晓东; 韩振奇; 刘立庄; 赵丹</td>\n",
       "      <td>计算机工程与应用</td>\n",
       "      <td>2021-06-29 09:20</td>\n",
       "      <td>NaN</td>\n",
       "      <td>26.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>20</th>\n",
       "      <td>21</td>\n",
       "      <td>智能交通管理系统发展趋势  网络首发</td>\n",
       "      <td>李瑞敏; 王长君</td>\n",
       "      <td>清华大学学报(自然科学版)</td>\n",
       "      <td>2021-06-29 08:59</td>\n",
       "      <td>NaN</td>\n",
       "      <td>94.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>21</th>\n",
       "      <td>22</td>\n",
       "      <td>人工智能写作背景下作者主体性的消解与重构——以陈楸帆人机交互写作实验为中心</td>\n",
       "      <td>周建琼</td>\n",
       "      <td>当代文坛</td>\n",
       "      <td>2021-06-29</td>\n",
       "      <td>NaN</td>\n",
       "      <td>28.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>22</th>\n",
       "      <td>23</td>\n",
       "      <td>空气源热泵除霜控制方法研究现状及展望  网络首发</td>\n",
       "      <td>王沣浩; 马龙霞; 王志华; 楼业春; 刘孜璇</td>\n",
       "      <td>制冷学报</td>\n",
       "      <td>2021-06-28 10:21</td>\n",
       "      <td>NaN</td>\n",
       "      <td>60.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>23</th>\n",
       "      <td>24</td>\n",
       "      <td>面向机器人自主分割的肉品识别分类系统实现  网络首发</td>\n",
       "      <td>马欢; 冀晶晶; 刘佳豪; 刘雨婷</td>\n",
       "      <td>图学学报</td>\n",
       "      <td>2021-06-28 08:48</td>\n",
       "      <td>NaN</td>\n",
       "      <td>150.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>24</th>\n",
       "      <td>25</td>\n",
       "      <td>AI辅助头颈CTA在诊断颅内动脉瘤中的应用</td>\n",
       "      <td>邓昊;韦鑫;曹闻挺;艾光勇;余菡</td>\n",
       "      <td>第三军医大学学报</td>\n",
       "      <td>2021-06-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>6.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>25</th>\n",
       "      <td>26</td>\n",
       "      <td>人工智能模型预测输尿管结石自然排出的多中心临床试验的验证研究</td>\n",
       "      <td>曾凯; 王新敏; 倪钊; 王勤章; 李强</td>\n",
       "      <td>中国全科医学</td>\n",
       "      <td>2021-06-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>18.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>26</th>\n",
       "      <td>27</td>\n",
       "      <td>城市暴雨内涝综述：特征、机理、数据与方法</td>\n",
       "      <td>黄华兵; 王先伟; 柳林</td>\n",
       "      <td>地理科学进展</td>\n",
       "      <td>2021-06-28</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>27</th>\n",
       "      <td>28</td>\n",
       "      <td>基于计算机视觉的织物光泽测试方法研究  网络首发</td>\n",
       "      <td>张建新; 黄钢; 李消晋</td>\n",
       "      <td>丝绸</td>\n",
       "      <td>2021-06-25 17:11</td>\n",
       "      <td>NaN</td>\n",
       "      <td>271.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>28</th>\n",
       "      <td>29</td>\n",
       "      <td>MIT Technology Review 2021年“十大突破性技术”解读  网络首发</td>\n",
       "      <td>祁海;张民;李俊涛;张小松;张强</td>\n",
       "      <td>中国科学基金</td>\n",
       "      <td>2021-06-25 17:07</td>\n",
       "      <td>NaN</td>\n",
       "      <td>140.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>29</th>\n",
       "      <td>30</td>\n",
       "      <td>基于区块链的联邦学习技术综述  网络首发</td>\n",
       "      <td>李凌霄;袁莎;金银玉</td>\n",
       "      <td>计算机应用研究</td>\n",
       "      <td>2021-06-25 16:23</td>\n",
       "      <td>NaN</td>\n",
       "      <td>365.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>30</th>\n",
       "      <td>31</td>\n",
       "      <td>竞技二打一游戏中同等牌力的研究  网络首发</td>\n",
       "      <td>李淑琴; 陈子鹏; 郑蓝舟; 孟坤</td>\n",
       "      <td>智能系统学报</td>\n",
       "      <td>2021-06-25 16:03</td>\n",
       "      <td>NaN</td>\n",
       "      <td>84.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>31</th>\n",
       "      <td>32</td>\n",
       "      <td>新信息技术对高等教育影响的演变及反思——基于2004-2021年《地平线报告》内容分析  网络首发</td>\n",
       "      <td>梁志星; 冯兴杰; 李佳; 杨珂</td>\n",
       "      <td>当代教育论坛</td>\n",
       "      <td>2021-06-25 16:03</td>\n",
       "      <td>NaN</td>\n",
       "      <td>199.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>32</th>\n",
       "      <td>33</td>\n",
       "      <td>机器人示教学习与技能泛化实验设计</td>\n",
       "      <td>占宏; 李娴; 杨辰光</td>\n",
       "      <td>实验技术与管理</td>\n",
       "      <td>2021-06-25 15:39</td>\n",
       "      <td>NaN</td>\n",
       "      <td>79.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>33</th>\n",
       "      <td>34</td>\n",
       "      <td>CoTransH: 科技文献知识图谱中语义关系预测的翻译模型  网络首发</td>\n",
       "      <td>陶玥; 余丽; 吴振新</td>\n",
       "      <td>情报理论与实践</td>\n",
       "      <td>2021-06-25 11:16</td>\n",
       "      <td>NaN</td>\n",
       "      <td>88.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>34</th>\n",
       "      <td>35</td>\n",
       "      <td>管道数字孪生体模型的构建及应用</td>\n",
       "      <td>陈斯迅;李在蓉;王禹钦;关红亮;高丽</td>\n",
       "      <td>油气储运</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>220.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>35</th>\n",
       "      <td>36</td>\n",
       "      <td>清华大学TH-Health研究室简介</td>\n",
       "      <td>NaN</td>\n",
       "      <td>针刺研究</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>18.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>36</th>\n",
       "      <td>37</td>\n",
       "      <td>大数据智能时代地图学课程内容改革探索</td>\n",
       "      <td>刘慧敏; 邓敏; 刘宝举; 陈杰</td>\n",
       "      <td>测绘通报</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>24.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>37</th>\n",
       "      <td>38</td>\n",
       "      <td>机器人智能化焊接技术发展综述及其在运载火箭贮箱中的应用</td>\n",
       "      <td>林尚扬;杨学勤;徐爱杰;陈华斌;林涛</td>\n",
       "      <td>上海航天(中英文)</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>24.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>38</th>\n",
       "      <td>39</td>\n",
       "      <td>智能博弈趋势下未来空天防御体系展望</td>\n",
       "      <td>王波兰</td>\n",
       "      <td>上海航天(中英文)</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>13.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>39</th>\n",
       "      <td>40</td>\n",
       "      <td>未来智能化网络化多功能卫星系统技术发展思考</td>\n",
       "      <td>陈占胜</td>\n",
       "      <td>上海航天(中英文)</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>9.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>40</th>\n",
       "      <td>41</td>\n",
       "      <td>人工智能方法在热模锻压力机故障诊断技术中的应用——评《实用模具设计与生产应用手册：挤压模与热锻模》</td>\n",
       "      <td>张诗雨</td>\n",
       "      <td>锻压技术</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>6.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>41</th>\n",
       "      <td>42</td>\n",
       "      <td>新型机械导航系统辅助穿刺初步实验研究</td>\n",
       "      <td>文艺; 李晓冰; 吴智群</td>\n",
       "      <td>介入放射学杂志</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>1.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>42</th>\n",
       "      <td>43</td>\n",
       "      <td>人机对抗智能技术最新进展及军事应用</td>\n",
       "      <td>聂凯; 曾科军; 孟庆海; 魏超</td>\n",
       "      <td>兵器装备工程学报</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>29.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>43</th>\n",
       "      <td>44</td>\n",
       "      <td>人工智能时代高校翻译技术实践环境建设研究</td>\n",
       "      <td>曹达钦; 戴钰涵</td>\n",
       "      <td>外语界</td>\n",
       "      <td>2021-06-25</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>44</th>\n",
       "      <td>45</td>\n",
       "      <td>融合视觉显著性再检测的孪生网络无人机目标跟踪算法  网络首发</td>\n",
       "      <td>周士琪; 王耀南; 钟杭</td>\n",
       "      <td>智能系统学报</td>\n",
       "      <td>2021-06-23 15:11</td>\n",
       "      <td>NaN</td>\n",
       "      <td>217.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>45</th>\n",
       "      <td>46</td>\n",
       "      <td>军事智能化的瓶颈与关键问题研究  网络首发</td>\n",
       "      <td>刘伟</td>\n",
       "      <td>人民论坛·学术前沿</td>\n",
       "      <td>2021-06-23 14:04</td>\n",
       "      <td>NaN</td>\n",
       "      <td>80.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>46</th>\n",
       "      <td>47</td>\n",
       "      <td>思索·睿智:迷雾中的笃行要件——记第55次情报科学读书会</td>\n",
       "      <td>于伟; 苏鹏</td>\n",
       "      <td>情报理论与实践</td>\n",
       "      <td>2021-06-23</td>\n",
       "      <td>NaN</td>\n",
       "      <td>19.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>47</th>\n",
       "      <td>48</td>\n",
       "      <td>多智能体协作场景下基于强化学习值分解的计算卸载策略  网络首发</td>\n",
       "      <td>张鹏; 田辉; 赵鹏涛; 贺硕; 童一帆</td>\n",
       "      <td>通信学报</td>\n",
       "      <td>2021-06-22 16:50</td>\n",
       "      <td>NaN</td>\n",
       "      <td>160.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>48</th>\n",
       "      <td>49</td>\n",
       "      <td>人工智能范式的革命与通用智能理论的创生  网络首发</td>\n",
       "      <td>钟义信</td>\n",
       "      <td>智能系统学报</td>\n",
       "      <td>2021-06-22 15:09</td>\n",
       "      <td>NaN</td>\n",
       "      <td>165.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>49</th>\n",
       "      <td>50</td>\n",
       "      <td>基于人工智能算法的作业现场人员设备资质识别技术研究  网络首发</td>\n",
       "      <td>陈晓江; 龙震岳; 曾纪钧</td>\n",
       "      <td>电测与仪表</td>\n",
       "      <td>2021-06-22 10:38</td>\n",
       "      <td>NaN</td>\n",
       "      <td>192.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "    Unnamed: 0                                                 篇名  \\\n",
       "0            1    机器学习在档案管理中的应用与挑战——基于新南威尔士州档案馆机器学习实验的调查与启示  网络首发   \n",
       "1            2                                 关于智能化战争的基本认知  网络首发   \n",
       "2            3                         金融科技中人工智能技术典型事实与核心规律  网络首发   \n",
       "3            4                            卫星在轨故障案例与人工智能故障诊断  网络首发   \n",
       "4            5                            高等职业教育智能生态系统:内涵、结构与实践路径   \n",
       "5            6                     近20年在线学习环境研究评述——基于LDA和DTM的动态分析   \n",
       "6            7                                 教育人工智能场域下教师角色与行动取向   \n",
       "7            8                             智能财务人才培养与浙江大学的探索  网络首发   \n",
       "8            9                     机器学习在智能配用电领域的应用：北美工程实践概述  网络首发   \n",
       "9           10                        国际经贸协定中的源代码规则新发展及中国立场  网络首发   \n",
       "10          11                        人工智能赋能高校数据治理：逻辑、挑战与实践  网络首发   \n",
       "11          12                             嵌入式神经网络加速器及SoC芯片  网络首发   \n",
       "12          13                                    绿色理念下智慧零售创新发展路径   \n",
       "13          14                 数字经济视野下跨境电商企业的升级策略研究——评《跨境电商与国际物流》   \n",
       "14          15                       智能化金融监管：模型框架、边缘约束和实践策略  网络首发   \n",
       "15          16                             “智能+”时代的现代文化产业体系：挑战与重塑   \n",
       "16          17                    人工智能在胸部创伤肋骨骨折CT诊断中应用的初步研究  网络首发   \n",
       "17          18                             人工智能技术在火电行业的应用探讨  网络首发   \n",
       "18          19                           基于切换输出机制的超短期风电功率预测  网络首发   \n",
       "19          20                        DCN:双通道密集哈达玛卷积的画质评价网络  网络首发   \n",
       "20          21                                 智能交通管理系统发展趋势  网络首发   \n",
       "21          22              人工智能写作背景下作者主体性的消解与重构——以陈楸帆人机交互写作实验为中心   \n",
       "22          23                           空气源热泵除霜控制方法研究现状及展望  网络首发   \n",
       "23          24                         面向机器人自主分割的肉品识别分类系统实现  网络首发   \n",
       "24          25                              AI辅助头颈CTA在诊断颅内动脉瘤中的应用   \n",
       "25          26                     人工智能模型预测输尿管结石自然排出的多中心临床试验的验证研究   \n",
       "26          27                               城市暴雨内涝综述：特征、机理、数据与方法   \n",
       "27          28                           基于计算机视觉的织物光泽测试方法研究  网络首发   \n",
       "28          29       MIT Technology Review 2021年“十大突破性技术”解读  网络首发   \n",
       "29          30                               基于区块链的联邦学习技术综述  网络首发   \n",
       "30          31                              竞技二打一游戏中同等牌力的研究  网络首发   \n",
       "31          32  新信息技术对高等教育影响的演变及反思——基于2004-2021年《地平线报告》内容分析  网络首发   \n",
       "32          33                                   机器人示教学习与技能泛化实验设计   \n",
       "33          34               CoTransH: 科技文献知识图谱中语义关系预测的翻译模型  网络首发   \n",
       "34          35                                    管道数字孪生体模型的构建及应用   \n",
       "35          36                                 清华大学TH-Health研究室简介   \n",
       "36          37                                 大数据智能时代地图学课程内容改革探索   \n",
       "37          38                        机器人智能化焊接技术发展综述及其在运载火箭贮箱中的应用   \n",
       "38          39                                  智能博弈趋势下未来空天防御体系展望   \n",
       "39          40                              未来智能化网络化多功能卫星系统技术发展思考   \n",
       "40          41  人工智能方法在热模锻压力机故障诊断技术中的应用——评《实用模具设计与生产应用手册：挤压模与热锻模》   \n",
       "41          42                                 新型机械导航系统辅助穿刺初步实验研究   \n",
       "42          43                                  人机对抗智能技术最新进展及军事应用   \n",
       "43          44                               人工智能时代高校翻译技术实践环境建设研究   \n",
       "44          45                     融合视觉显著性再检测的孪生网络无人机目标跟踪算法  网络首发   \n",
       "45          46                              军事智能化的瓶颈与关键问题研究  网络首发   \n",
       "46          47                       思索·睿智:迷雾中的笃行要件——记第55次情报科学读书会   \n",
       "47          48                    多智能体协作场景下基于强化学习值分解的计算卸载策略  网络首发   \n",
       "48          49                          人工智能范式的革命与通用智能理论的创生  网络首发   \n",
       "49          50                    基于人工智能算法的作业现场人员设备资质识别技术研究  网络首发   \n",
       "\n",
       "                         作者               刊名              发表时间  被引     下载  操作  \\\n",
       "0                  代林序; 张玉洁            档案与建设  2021-07-02 16:16 NaN    NaN  下载   \n",
       "1                        郭明        人民论坛·学术前沿  2021-07-02 15:49 NaN    NaN  下载   \n",
       "2             陈增敬; 严晓东; 冯新伟           中国科学基金  2021-07-02 11:39 NaN    NaN  下载   \n",
       "3        王亚坤;杨凯飞;张婕;郭莉芳;韩笑冬         中国空间科学技术  2021-07-02 08:49 NaN    NaN  下载   \n",
       "4                        徐晔           中国远程教育        2021-07-02 NaN    NaN  下载   \n",
       "5                  牛晓杰; 郑勤华           中国远程教育        2021-07-02 NaN    NaN  下载   \n",
       "6             赵磊磊; 马玉菲; 代蕊华           中国远程教育        2021-07-02 NaN    NaN  下载   \n",
       "7                    陈俊; 董望             财会月刊  2021-07-01 15:42 NaN    NaN  下载   \n",
       "8    李亦言; 胡荣兴; 宋立冬; 贾乾罡; 陆宁          电力系统自动化  2021-07-01 09:50 NaN    NaN  下载   \n",
       "9                       鄢雨虹          武大国际法评论  2021-07-01 09:16 NaN    NaN  下载   \n",
       "10                      赵磊磊           重庆高教研究  2021-06-30 14:14 NaN  114.0  下载   \n",
       "11             易冬柏; 陈恒; 何乐年           仪器仪表学报  2021-06-30 10:09 NaN   59.0  下载   \n",
       "12                       翟璇           商业经济研究        2021-06-30 NaN    6.0  下载   \n",
       "13                      单浩耘           商业经济研究        2021-06-30 NaN   15.0  下载   \n",
       "14                      乔宇锋             南方金融  2021-06-29 17:04 NaN  105.0  下载   \n",
       "15                 解学芳; 雷文宣  深圳大学学报(人文社会科学版)  2021-06-29 15:45 NaN   65.0  下载   \n",
       "16        刘想;谢辉辉;许玉峰;陶晓峰;柳林    上海交通大学学报(医学版)  2021-06-29 14:47 NaN   38.0  下载   \n",
       "17    华志刚; 范佳卿; 郭荣; 汪勇; 吴潇翔             中国电力  2021-06-29 11:10 NaN  127.0  下载   \n",
       "18             杨茂; 许传宇; 王凯旋            高电压技术  2021-06-29 11:02 NaN   23.0  下载   \n",
       "19        杨晓东; 韩振奇; 刘立庄; 赵丹         计算机工程与应用  2021-06-29 09:20 NaN   26.0  下载   \n",
       "20                 李瑞敏; 王长君    清华大学学报(自然科学版)  2021-06-29 08:59 NaN   94.0  下载   \n",
       "21                      周建琼             当代文坛        2021-06-29 NaN   28.0  下载   \n",
       "22  王沣浩; 马龙霞; 王志华; 楼业春; 刘孜璇             制冷学报  2021-06-28 10:21 NaN   60.0  下载   \n",
       "23        马欢; 冀晶晶; 刘佳豪; 刘雨婷             图学学报  2021-06-28 08:48 NaN  150.0  下载   \n",
       "24         邓昊;韦鑫;曹闻挺;艾光勇;余菡         第三军医大学学报        2021-06-28 NaN    6.0  下载   \n",
       "25     曾凯; 王新敏; 倪钊; 王勤章; 李强           中国全科医学        2021-06-28 NaN   18.0  下载   \n",
       "26             黄华兵; 王先伟; 柳林           地理科学进展        2021-06-28 NaN    NaN  下载   \n",
       "27             张建新; 黄钢; 李消晋               丝绸  2021-06-25 17:11 NaN  271.0  下载   \n",
       "28         祁海;张民;李俊涛;张小松;张强           中国科学基金  2021-06-25 17:07 NaN  140.0  下载   \n",
       "29               李凌霄;袁莎;金银玉          计算机应用研究  2021-06-25 16:23 NaN  365.0  下载   \n",
       "30        李淑琴; 陈子鹏; 郑蓝舟; 孟坤           智能系统学报  2021-06-25 16:03 NaN   84.0  下载   \n",
       "31         梁志星; 冯兴杰; 李佳; 杨珂           当代教育论坛  2021-06-25 16:03 NaN  199.0  下载   \n",
       "32              占宏; 李娴; 杨辰光          实验技术与管理  2021-06-25 15:39 NaN   79.0  下载   \n",
       "33              陶玥; 余丽; 吴振新          情报理论与实践  2021-06-25 11:16 NaN   88.0  下载   \n",
       "34       陈斯迅;李在蓉;王禹钦;关红亮;高丽             油气储运        2021-06-25 NaN  220.0  下载   \n",
       "35                      NaN             针刺研究        2021-06-25 NaN   18.0  下载   \n",
       "36         刘慧敏; 邓敏; 刘宝举; 陈杰             测绘通报        2021-06-25 NaN   24.0  下载   \n",
       "37       林尚扬;杨学勤;徐爱杰;陈华斌;林涛        上海航天(中英文)        2021-06-25 NaN   24.0  下载   \n",
       "38                      王波兰        上海航天(中英文)        2021-06-25 NaN   13.0  下载   \n",
       "39                      陈占胜        上海航天(中英文)        2021-06-25 NaN    9.0  下载   \n",
       "40                      张诗雨             锻压技术        2021-06-25 NaN    6.0  下载   \n",
       "41             文艺; 李晓冰; 吴智群          介入放射学杂志        2021-06-25 NaN    1.0  下载   \n",
       "42         聂凯; 曾科军; 孟庆海; 魏超         兵器装备工程学报        2021-06-25 NaN   29.0  下载   \n",
       "43                 曹达钦; 戴钰涵              外语界        2021-06-25 NaN    NaN  下载   \n",
       "44             周士琪; 王耀南; 钟杭           智能系统学报  2021-06-23 15:11 NaN  217.0  下载   \n",
       "45                       刘伟        人民论坛·学术前沿  2021-06-23 14:04 NaN   80.0  下载   \n",
       "46                   于伟; 苏鹏          情报理论与实践        2021-06-23 NaN   19.0  下载   \n",
       "47     张鹏; 田辉; 赵鹏涛; 贺硕; 童一帆             通信学报  2021-06-22 16:50 NaN  160.0  下载   \n",
       "48                      钟义信           智能系统学报  2021-06-22 15:09 NaN  165.0  下载   \n",
       "49            陈晓江; 龙震岳; 曾纪钧            电测与仪表  2021-06-22 10:38 NaN  192.0  下载   \n",
       "\n",
       "                                                详细页链接  \\\n",
       "0   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "1   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "2   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "3   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "4   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "5   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "6   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "7   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "8   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "9   https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "10  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "11  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "12  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "13  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "14  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "15  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "16  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "17  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "18  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "19  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "20  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "21  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "22  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "23  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "24  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "25  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "26  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "27  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "28  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "29  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "30  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "31  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "32  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "33  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "34  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "35  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "36  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "37  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "38  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "39  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "40  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "41  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "42  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "43  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "44  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "45  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "46  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "47  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "48  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "49  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "\n",
       "                                              PDF下载链接  \n",
       "0   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "1   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "2   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "3   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "4   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "5   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "6   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "7   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "8   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "9   https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "10  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "11  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "12  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "13  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "14  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "15  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "16  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "17  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "18  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "19  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "20  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "21  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "22  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "23  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "24  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "25  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "26  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "27  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "28  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "29  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "30  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "31  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "32  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "33  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "34  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "35  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "36  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "37  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "38  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "39  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "40  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "41  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "42  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "43  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "44  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "45  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "46  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "47  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "48  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "49  https://kns.cnki.net/kcms/download.aspx?filena...  "
      ]
     },
     "execution_count": 29,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_pdf_links=pd.DataFrame({'PDF下载链接':pdf_href})\n",
    "df_首页=pd.concat([df_首页,df_pdf_links],axis=1)\n",
    "df_首页"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 翻页"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 30,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'下一页'"
      ]
     },
     "execution_count": 30,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "element = driver.find_element_by_id('PageNext')\n",
    "element.get_attribute('innerHTML')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 31,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "'1/120'"
      ]
     },
     "execution_count": 31,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# 查看上限\n",
    "element = driver.find_element_by_xpath('//span[@class=\"countPageMark\"]')\n",
    "page_str = element.get_attribute('innerHTML')\n",
    "page_str "
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 32,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "[1, 2, 3, 4, 5, 6, 7, 8, 9, 10, 11, 12, 13, 14, 15, 16]"
      ]
     },
     "execution_count": 32,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "page_int = page_str.split('/')\n",
    "pages = list(range(1,int(page_int[1])+1))\n",
    "# 设置爬取页数\n",
    "pages = list(range(1,17))\n",
    "pages"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 29,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-29-889a0c377e4b>:2: DeprecationWarning: use driver.switch_to.window instead\n",
      "  driver.switch_to_window(driver.window_handles[2])\n"
     ]
    }
   ],
   "source": [
    "# 切换窗口\n",
    "driver.switch_to_window(driver.window_handles[2])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 33,
   "metadata": {},
   "outputs": [],
   "source": [
    "import time"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 34,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1\t2\t3\t4\t5\t6\t7\t8\t9\t10\t11\t12\t13\t14\t15\t16\t"
     ]
    }
   ],
   "source": [
    "root_group=[]\n",
    "\n",
    "表格_html = dict()\n",
    "main_content =\"\"\n",
    "element = None\n",
    "\n",
    "def page_process(pages):\n",
    "    \"\"\"CNKI翻页获取信息\"\"\"\n",
    "    for p in pages:\n",
    "        print(p,end='\\t')\n",
    "        driver.find_element_by_id('PageNext').click()\n",
    "        time.sleep(15)\n",
    "        \n",
    "        html=driver.page_source\n",
    "        root=fromstring(html)\n",
    "        root_group.append(root)\n",
    "        \n",
    "        element = driver.find_element_by_id('gridTable')\n",
    "        main_content = element.get_attribute('innerHTML')\n",
    "        表格_html[p] = main_content\n",
    "page_process(pages)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 35,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>html_snippets</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>5</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>6</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>7</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>8</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>9</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>10</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>11</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>12</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>13</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>14</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>15</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>16</th>\n",
       "      <td>\\n&lt;div class=\"toolbar\"&gt;&lt;div id=\"countPageDiv\" ...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "</div>"
      ],
      "text/plain": [
       "                                        html_snippets\n",
       "1   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "2   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "3   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "4   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "5   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "6   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "7   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "8   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "9   \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "10  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "11  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "12  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "13  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "14  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "15  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ...\n",
       "16  \\n<div class=\"toolbar\"><div id=\"countPageDiv\" ..."
      ]
     },
     "execution_count": 35,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df = pd.DataFrame([表格_html]).T\n",
    "df.columns = [\"html_snippets\"]\n",
    "df"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 36,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>51</td>\n",
       "      <td>基于5G与AI的生态环境监测网络平台探讨</td>\n",
       "      <td>徐爱兰; 耿建生</td>\n",
       "      <td>环境监测管理与技术</td>\n",
       "      <td>2021-06-22</td>\n",
       "      <td>NaN</td>\n",
       "      <td>186.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>52</td>\n",
       "      <td>一种小地质体智能综合方法  网络首发</td>\n",
       "      <td>何文娜;朱长青;徐可;陈圆圆;李仰春</td>\n",
       "      <td>地球物理学进展</td>\n",
       "      <td>2021-06-21 15:33</td>\n",
       "      <td>NaN</td>\n",
       "      <td>87.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>53</td>\n",
       "      <td>能源转型背景下电力系统不确定性及应对方法综述  网络首发</td>\n",
       "      <td>徐潇源;王晗;严正;鲁卓欣;康重庆</td>\n",
       "      <td>电力系统自动化</td>\n",
       "      <td>2021-06-21 13:13</td>\n",
       "      <td>NaN</td>\n",
       "      <td>229.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>54</td>\n",
       "      <td>机器人辅助椎体后凸成形术治疗单/双节段骨质疏松性椎体压缩骨折临床疗效  网络首发</td>\n",
       "      <td>袁伟;孟小童;刘欣春;朱海涛;丛琳</td>\n",
       "      <td>中国修复重建外科杂志</td>\n",
       "      <td>2021-06-21 10:47</td>\n",
       "      <td>NaN</td>\n",
       "      <td>44.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>55</td>\n",
       "      <td>人工智能价值网络下零售企业商业模式创新与企业效益相关性分析</td>\n",
       "      <td>郭漫勤; 师佳英</td>\n",
       "      <td>商业经济研究</td>\n",
       "      <td>2021-06-21</td>\n",
       "      <td>NaN</td>\n",
       "      <td>240.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>795</th>\n",
       "      <td>846</td>\n",
       "      <td>数字经济研究·主持人语</td>\n",
       "      <td>谢康</td>\n",
       "      <td>北京交通大学学报(社会科学版)</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>49.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>796</th>\n",
       "      <td>847</td>\n",
       "      <td>“一带一路”数字经济的发展图景与法治路径</td>\n",
       "      <td>赵骏</td>\n",
       "      <td>中国法律评论</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>473.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>797</th>\n",
       "      <td>848</td>\n",
       "      <td>智能产业生态系统的结构性特征及发展路径</td>\n",
       "      <td>杜爽</td>\n",
       "      <td>经济纵横</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>144.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>798</th>\n",
       "      <td>849</td>\n",
       "      <td>一纸风行到一端在手——《华西都市报》的转型探析</td>\n",
       "      <td>刘洁</td>\n",
       "      <td>出版广角</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>58.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>799</th>\n",
       "      <td>850</td>\n",
       "      <td>“物联网+人工智能”：Web3.0时代的数字传媒发展初探</td>\n",
       "      <td>冉凌宇</td>\n",
       "      <td>出版广角</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>241.0</td>\n",
       "      <td>下载</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>800 rows × 8 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     Unnamed: 0                                        篇名                  作者  \\\n",
       "0            51                      基于5G与AI的生态环境监测网络平台探讨            徐爱兰; 耿建生   \n",
       "1            52                        一种小地质体智能综合方法  网络首发  何文娜;朱长青;徐可;陈圆圆;李仰春   \n",
       "2            53              能源转型背景下电力系统不确定性及应对方法综述  网络首发   徐潇源;王晗;严正;鲁卓欣;康重庆   \n",
       "3            54  机器人辅助椎体后凸成形术治疗单/双节段骨质疏松性椎体压缩骨折临床疗效  网络首发   袁伟;孟小童;刘欣春;朱海涛;丛琳   \n",
       "4            55             人工智能价值网络下零售企业商业模式创新与企业效益相关性分析            郭漫勤; 师佳英   \n",
       "..          ...                                       ...                 ...   \n",
       "795         846                               数字经济研究·主持人语                  谢康   \n",
       "796         847                      “一带一路”数字经济的发展图景与法治路径                  赵骏   \n",
       "797         848                       智能产业生态系统的结构性特征及发展路径                  杜爽   \n",
       "798         849                   一纸风行到一端在手——《华西都市报》的转型探析                  刘洁   \n",
       "799         850              “物联网+人工智能”：Web3.0时代的数字传媒发展初探                 冉凌宇   \n",
       "\n",
       "                  刊名              发表时间  被引     下载  操作  \n",
       "0          环境监测管理与技术        2021-06-22 NaN  186.0  下载  \n",
       "1            地球物理学进展  2021-06-21 15:33 NaN   87.0  下载  \n",
       "2            电力系统自动化  2021-06-21 13:13 NaN  229.0  下载  \n",
       "3         中国修复重建外科杂志  2021-06-21 10:47 NaN   44.0  下载  \n",
       "4             商业经济研究        2021-06-21 NaN  240.0  下载  \n",
       "..               ...               ...  ..    ...  ..  \n",
       "795  北京交通大学学报(社会科学版)        2021-04-15 NaN   49.0  下载  \n",
       "796           中国法律评论        2021-04-15 NaN  473.0  下载  \n",
       "797             经济纵横        2021-04-15 NaN  144.0  下载  \n",
       "798             出版广角        2021-04-15 NaN   58.0  下载  \n",
       "799             出版广角        2021-04-15 NaN  241.0  下载  \n",
       "\n",
       "[800 rows x 8 columns]"
      ]
     },
     "execution_count": 36,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "l_df = []\n",
    "for p in pages:\n",
    "    表格 = pd.read_html(表格_html[p])[0]\n",
    "    l_df.append(表格)\n",
    "df_url_out = pd.concat(l_df).reset_index(drop=True)\n",
    "df_url_out"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 37,
   "metadata": {},
   "outputs": [],
   "source": [
    "# 详细页链接\n",
    "href_group=[]\n",
    "\n",
    "for root in root_group:\n",
    "    href = root.xpath('.//*[@id=\"gridTable\"]/table/tbody/tr/td[2]/a/@href')\n",
    "    href_group.append(href)\n",
    "    \n",
    "href_group=href_group[0]+href_group[1]+href_group[2]+href_group[3]+href_group[4]+href_group[5]+href_group[6]+href_group[7]+href_group[8]+href_group[9]+href_group[10]+href_group[11]+href_group[12]+href_group[13]+href_group[14]+href_group[15]"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 38,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>详细页链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>795</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>796</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>797</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>798</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>799</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>800 rows × 1 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                 详细页链接\n",
       "0    https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "1    https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "2    https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "3    https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "4    https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "..                                                 ...\n",
       "795  https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "796  https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "797  https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "798  https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "799  https://kns.cnki.net/kcms/detail/detail.aspx?d...\n",
       "\n",
       "[800 rows x 1 columns]"
      ]
     },
     "execution_count": 38,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Run every collected href through correct(), then tabulate the results as the detail-page link column\n",
    "href_group_correct=list(map(correct, href_group))\n",
    "df_link=pd.DataFrame(data={'详细页链接':href_group_correct})\n",
    "df_link"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 39,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "1\n",
      "2\n",
      "3\n",
      "4\n",
      "5\n",
      "6\n",
      "7\n",
      "8\n",
      "9\n",
      "10\n",
      "11\n",
      "12\n",
      "13\n",
      "14\n",
      "15\n",
      "16\n",
      "17\n",
      "18\n",
      "19\n",
      "20\n",
      "21\n",
      "22\n",
      "23\n",
      "24\n",
      "25\n",
      "26\n",
      "27\n",
      "28\n",
      "29\n",
      "30\n",
      "31\n",
      "32\n",
      "33\n",
      "34\n",
      "35\n",
      "36\n",
      "37\n",
      "38\n",
      "39\n",
      "40\n",
      "41\n",
      "42\n",
      "43\n",
      "44\n",
      "45\n",
      "46\n",
      "47\n",
      "48\n",
      "49\n",
      "50\n",
      "51\n",
      "52\n",
      "53\n",
      "54\n",
      "55\n",
      "56\n",
      "57\n",
      "58\n",
      "59\n",
      "60\n",
      "61\n",
      "62\n",
      "63\n",
      "64\n",
      "65\n",
      "66\n",
      "67\n",
      "68\n",
      "69\n",
      "70\n",
      "71\n",
      "72\n",
      "73\n",
      "74\n",
      "75\n",
      "76\n",
      "77\n",
      "78\n",
      "79\n",
      "80\n",
      "81\n",
      "82\n",
      "83\n",
      "84\n",
      "85\n",
      "86\n",
      "87\n",
      "88\n",
      "89\n",
      "90\n",
      "91\n",
      "92\n",
      "93\n",
      "94\n",
      "95\n",
      "96\n",
      "97\n",
      "98\n",
      "99\n",
      "100\n",
      "101\n",
      "102\n",
      "103\n",
      "104\n",
      "105\n",
      "106\n",
      "107\n",
      "108\n",
      "109\n",
      "110\n",
      "111\n",
      "112\n",
      "113\n",
      "114\n",
      "115\n",
      "116\n",
      "117\n",
      "118\n",
      "119\n",
      "120\n",
      "121\n",
      "122\n",
      "123\n",
      "124\n",
      "125\n",
      "126\n",
      "127\n",
      "128\n",
      "129\n",
      "130\n",
      "131\n",
      "132\n",
      "133\n",
      "134\n",
      "135\n",
      "136\n",
      "137\n",
      "138\n",
      "139\n",
      "140\n",
      "141\n",
      "142\n",
      "143\n",
      "144\n",
      "145\n",
      "146\n",
      "147\n",
      "148\n",
      "149\n",
      "150\n",
      "151\n",
      "152\n",
      "153\n",
      "154\n",
      "155\n",
      "156\n",
      "157\n",
      "158\n",
      "159\n",
      "160\n",
      "161\n",
      "162\n",
      "163\n",
      "164\n",
      "165\n",
      "166\n",
      "167\n",
      "168\n",
      "169\n",
      "170\n",
      "171\n",
      "172\n",
      "173\n",
      "174\n",
      "175\n",
      "176\n",
      "177\n",
      "178\n",
      "179\n",
      "180\n",
      "181\n",
      "182\n",
      "183\n",
      "184\n",
      "185\n",
      "186\n",
      "187\n",
      "188\n",
      "189\n",
      "190\n",
      "191\n",
      "192\n",
      "193\n",
      "194\n",
      "195\n",
      "196\n",
      "197\n",
      "198\n",
      "199\n",
      "200\n",
      "201\n",
      "202\n",
      "203\n",
      "204\n",
      "205\n",
      "206\n",
      "207\n",
      "208\n",
      "209\n",
      "210\n",
      "211\n",
      "212\n",
      "213\n",
      "214\n",
      "215\n",
      "216\n",
      "217\n",
      "218\n",
      "219\n",
      "220\n",
      "221\n",
      "222\n",
      "223\n",
      "224\n",
      "225\n",
      "226\n",
      "227\n",
      "228\n",
      "229\n",
      "230\n",
      "231\n",
      "232\n",
      "233\n",
      "234\n",
      "235\n",
      "236\n",
      "237\n",
      "238\n",
      "239\n",
      "240\n",
      "241\n",
      "242\n",
      "243\n",
      "244\n",
      "245\n",
      "246\n",
      "247\n",
      "248\n",
      "249\n",
      "250\n",
      "251\n",
      "252\n",
      "253\n",
      "254\n",
      "255\n",
      "256\n",
      "257\n",
      "258\n",
      "259\n",
      "260\n",
      "261\n",
      "262\n",
      "263\n",
      "264\n",
      "265\n",
      "266\n",
      "267\n",
      "268\n",
      "269\n",
      "270\n",
      "271\n",
      "272\n",
      "273\n",
      "274\n",
      "275\n",
      "276\n",
      "277\n",
      "278\n",
      "279\n",
      "280\n",
      "281\n",
      "282\n",
      "283\n",
      "284\n",
      "285\n",
      "286\n",
      "287\n",
      "288\n",
      "289\n",
      "290\n",
      "291\n",
      "292\n",
      "293\n",
      "294\n",
      "295\n",
      "296\n",
      "297\n",
      "298\n",
      "299\n",
      "300\n",
      "301\n",
      "302\n",
      "303\n",
      "304\n",
      "305\n",
      "306\n",
      "307\n",
      "308\n",
      "309\n",
      "310\n",
      "311\n",
      "312\n",
      "313\n",
      "314\n",
      "315\n",
      "316\n",
      "317\n",
      "318\n",
      "319\n",
      "320\n",
      "321\n",
      "322\n",
      "323\n",
      "324\n",
      "325\n",
      "326\n",
      "327\n",
      "328\n",
      "329\n",
      "330\n",
      "331\n",
      "332\n",
      "333\n",
      "334\n",
      "335\n",
      "336\n",
      "337\n",
      "338\n",
      "339\n",
      "340\n",
      "341\n",
      "342\n",
      "343\n",
      "344\n",
      "345\n",
      "346\n",
      "347\n",
      "348\n",
      "349\n",
      "350\n",
      "351\n",
      "352\n",
      "353\n",
      "354\n",
      "355\n",
      "356\n",
      "357\n",
      "358\n",
      "359\n",
      "360\n",
      "361\n",
      "362\n",
      "363\n",
      "364\n",
      "365\n",
      "366\n",
      "367\n",
      "368\n",
      "369\n",
      "370\n",
      "371\n",
      "372\n",
      "373\n",
      "374\n",
      "375\n",
      "376\n",
      "377\n",
      "378\n",
      "379\n",
      "380\n",
      "381\n",
      "382\n",
      "383\n",
      "384\n",
      "385\n",
      "386\n",
      "387\n",
      "388\n",
      "389\n",
      "390\n",
      "391\n",
      "392\n",
      "393\n",
      "394\n",
      "395\n",
      "396\n",
      "397\n",
      "398\n",
      "399\n",
      "400\n",
      "401\n",
      "402\n",
      "403\n",
      "404\n",
      "405\n",
      "406\n",
      "407\n",
      "408\n",
      "409\n",
      "410\n",
      "411\n",
      "412\n",
      "413\n",
      "414\n",
      "415\n",
      "416\n",
      "417\n",
      "418\n",
      "419\n",
      "420\n",
      "421\n",
      "422\n",
      "423\n",
      "424\n",
      "425\n",
      "426\n",
      "427\n",
      "428\n",
      "429\n",
      "430\n",
      "431\n",
      "432\n",
      "433\n",
      "434\n",
      "435\n",
      "436\n",
      "437\n",
      "438\n",
      "439\n",
      "440\n",
      "441\n",
      "442\n",
      "443\n",
      "444\n",
      "445\n",
      "446\n",
      "447\n",
      "448\n",
      "449\n",
      "450\n",
      "451\n",
      "452\n",
      "453\n",
      "454\n",
      "455\n",
      "456\n",
      "457\n",
      "458\n",
      "459\n",
      "460\n",
      "461\n",
      "462\n",
      "463\n",
      "464\n",
      "465\n",
      "466\n",
      "467\n",
      "468\n",
      "469\n",
      "470\n",
      "471\n",
      "472\n",
      "473\n",
      "474\n",
      "475\n",
      "476\n",
      "477\n",
      "478\n",
      "479\n",
      "480\n",
      "481\n",
      "482\n",
      "483\n",
      "484\n",
      "485\n",
      "486\n",
      "487\n",
      "488\n",
      "489\n",
      "490\n",
      "491\n",
      "492\n",
      "493\n",
      "494\n",
      "495\n",
      "496\n",
      "497\n",
      "498\n",
      "499\n",
      "500\n",
      "501\n",
      "502\n",
      "503\n",
      "504\n",
      "505\n",
      "506\n",
      "507\n",
      "508\n",
      "509\n",
      "510\n",
      "511\n",
      "512\n",
      "513\n",
      "514\n",
      "515\n",
      "516\n",
      "517\n",
      "518\n",
      "519\n",
      "520\n",
      "521\n",
      "522\n",
      "523\n",
      "524\n",
      "525\n",
      "526\n",
      "527\n",
      "528\n",
      "529\n",
      "530\n",
      "531\n",
      "532\n",
      "533\n",
      "534\n",
      "535\n",
      "536\n",
      "537\n",
      "538\n",
      "539\n",
      "540\n",
      "541\n",
      "542\n",
      "543\n",
      "544\n",
      "545\n",
      "546\n",
      "547\n",
      "548\n",
      "549\n",
      "550\n",
      "551\n",
      "552\n",
      "553\n",
      "554\n",
      "555\n",
      "556\n",
      "557\n",
      "558\n",
      "559\n",
      "560\n",
      "561\n",
      "562\n",
      "563\n",
      "564\n",
      "565\n",
      "566\n",
      "567\n",
      "568\n",
      "569\n",
      "570\n",
      "571\n",
      "572\n",
      "573\n",
      "574\n",
      "575\n",
      "576\n",
      "577\n",
      "578\n",
      "579\n",
      "580\n",
      "581\n",
      "582\n",
      "583\n",
      "584\n",
      "585\n",
      "586\n",
      "587\n",
      "588\n",
      "589\n",
      "590\n",
      "591\n",
      "592\n",
      "593\n",
      "594\n",
      "595\n",
      "596\n",
      "597\n",
      "598\n",
      "599\n",
      "600\n",
      "601\n",
      "602\n",
      "603\n",
      "604\n",
      "605\n",
      "606\n",
      "607\n",
      "608\n",
      "609\n",
      "610\n",
      "611\n",
      "612\n",
      "613\n",
      "614\n",
      "615\n",
      "616\n",
      "617\n",
      "618\n",
      "619\n",
      "620\n",
      "621\n",
      "622\n",
      "623\n",
      "624\n",
      "625\n",
      "626\n",
      "627\n",
      "628\n",
      "629\n",
      "630\n",
      "631\n",
      "632\n",
      "633\n",
      "634\n",
      "635\n",
      "636\n",
      "637\n",
      "638\n",
      "639\n",
      "640\n",
      "641\n",
      "642\n",
      "643\n",
      "644\n",
      "645\n",
      "646\n",
      "647\n",
      "648\n",
      "649\n",
      "650\n",
      "651\n",
      "652\n",
      "653\n",
      "654\n",
      "655\n",
      "656\n",
      "657\n",
      "658\n",
      "659\n",
      "660\n",
      "661\n",
      "662\n",
      "663\n",
      "664\n",
      "665\n",
      "666\n",
      "667\n",
      "668\n",
      "669\n",
      "670\n",
      "671\n",
      "672\n",
      "673\n",
      "674\n",
      "675\n",
      "676\n",
      "677\n",
      "678\n",
      "679\n",
      "680\n",
      "681\n",
      "682\n",
      "683\n",
      "684\n",
      "685\n",
      "686\n",
      "687\n",
      "688\n",
      "689\n",
      "690\n",
      "691\n",
      "692\n",
      "693\n",
      "694\n",
      "695\n",
      "696\n",
      "697\n",
      "698\n",
      "699\n",
      "700\n",
      "701\n",
      "702\n",
      "703\n",
      "704\n",
      "705\n",
      "706\n",
      "707\n",
      "708\n",
      "709\n",
      "710\n",
      "711\n",
      "712\n",
      "713\n",
      "714\n",
      "715\n",
      "716\n",
      "717\n",
      "718\n",
      "719\n",
      "720\n",
      "721\n",
      "722\n",
      "723\n",
      "724\n",
      "725\n",
      "726\n",
      "727\n",
      "728\n",
      "729\n",
      "730\n",
      "731\n",
      "732\n",
      "733\n",
      "734\n",
      "735\n",
      "736\n",
      "737\n",
      "738\n",
      "739\n",
      "740\n",
      "741\n",
      "742\n",
      "743\n",
      "744\n",
      "745\n",
      "746\n",
      "747\n",
      "748\n",
      "749\n",
      "750\n",
      "751\n",
      "752\n",
      "753\n",
      "754\n",
      "755\n",
      "756\n",
      "757\n",
      "758\n",
      "759\n",
      "760\n",
      "761\n",
      "762\n",
      "763\n",
      "764\n",
      "765\n",
      "766\n",
      "767\n",
      "768\n",
      "769\n",
      "770\n",
      "771\n",
      "772\n",
      "773\n",
      "774\n",
      "775\n",
      "776\n",
      "777\n",
      "778\n",
      "779\n",
      "780\n",
      "781\n",
      "782\n",
      "783\n",
      "784\n",
      "785\n",
      "786\n",
      "787\n",
      "788\n",
      "789\n",
      "790\n",
      "791\n",
      "792\n",
      "793\n",
      "794\n",
      "795\n",
      "796\n",
      "797\n",
      "798\n",
      "799\n",
      "800\n"
     ]
    }
   ],
   "source": [
    "# Collect the PDF download href from each article detail page.\n",
    "# pdf_links holds one entry per page that was fetched and parsed successfully;\n",
    "# failed_urls records the detail pages that were skipped, so gaps are visible\n",
    "# instead of being dropped silently.\n",
    "pdf_links=[]\n",
    "failed_urls=[]\n",
    "link_num = 0\n",
    "\n",
    "for url in href_group_correct:\n",
    "    try:\n",
    "        r = session.get(url)\n",
    "        # index 1: the second href matched for id=\"pdfDown\" is the one kept\n",
    "        pdf_link_xpath=r.html.xpath('//*[@id=\"pdfDown\"]/@href')[1]\n",
    "        pdf_links.append(pdf_link_xpath)\n",
    "        link_num += 1\n",
    "        print(link_num)\n",
    "    except Exception as err:\n",
    "        # Catch Exception rather than using a bare except, so that\n",
    "        # KeyboardInterrupt can still stop this long-running loop.\n",
    "        failed_urls.append(url)\n",
    "        print('failed:', url, repr(err))\n",
    "    # Throttle after every request, including failed ones\n",
    "    time.sleep(5)\n",
    "\n",
    "# NOTE(review): if failed_urls is non-empty, pdf_links is shorter than\n",
    "# href_group_correct and no longer lines up with it position by position.\n",
    "if failed_urls:\n",
    "    print('pages skipped:', len(failed_urls))"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 40,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>PDF下载链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>795</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>796</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>797</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>798</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>799</th>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>800 rows × 1 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                               PDF下载链接\n",
       "0    https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "1    https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "2    https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "3    https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "4    https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "..                                                 ...\n",
       "795  https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "796  https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "797  https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "798  https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "799  https://kns.cnki.net/kcms/download.aspx?filena...\n",
       "\n",
       "[800 rows x 1 columns]"
      ]
     },
     "execution_count": 40,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Prefix each scraped href with the CNKI host to form the full download URL\n",
    "pdf_links_correct=[\n",
    "    'https://kns.cnki.net'+relative_href\n",
    "    for relative_href in pdf_links\n",
    "]\n",
    "df_pdf_download=pd.DataFrame(data={'PDF下载链接':pdf_links_correct})\n",
    "df_pdf_download"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 41,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>详细页链接</th>\n",
       "      <th>PDF下载链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>795</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>796</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>797</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>798</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>799</th>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>800 rows × 2 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "                                                 详细页链接  \\\n",
       "0    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "1    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "2    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "3    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "4    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "..                                                 ...   \n",
       "795  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "796  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "797  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "798  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "799  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "\n",
       "                                               PDF下载链接  \n",
       "0    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "1    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "2    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "3    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "4    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "..                                                 ...  \n",
       "795  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "796  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "797  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "798  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "799  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "\n",
       "[800 rows x 2 columns]"
      ]
     },
     "execution_count": 41,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "# Put the detail-page links and the PDF links side by side, matched on the row index\n",
    "df_总=pd.concat(objs=[df_link,df_pdf_download],axis='columns')\n",
    "df_总"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 42,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "      <th>详细页链接</th>\n",
       "      <th>PDF下载链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>51</td>\n",
       "      <td>基于5G与AI的生态环境监测网络平台探讨</td>\n",
       "      <td>徐爱兰; 耿建生</td>\n",
       "      <td>环境监测管理与技术</td>\n",
       "      <td>2021-06-22</td>\n",
       "      <td>NaN</td>\n",
       "      <td>186.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>52</td>\n",
       "      <td>一种小地质体智能综合方法  网络首发</td>\n",
       "      <td>何文娜;朱长青;徐可;陈圆圆;李仰春</td>\n",
       "      <td>地球物理学进展</td>\n",
       "      <td>2021-06-21 15:33</td>\n",
       "      <td>NaN</td>\n",
       "      <td>87.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>53</td>\n",
       "      <td>能源转型背景下电力系统不确定性及应对方法综述  网络首发</td>\n",
       "      <td>徐潇源;王晗;严正;鲁卓欣;康重庆</td>\n",
       "      <td>电力系统自动化</td>\n",
       "      <td>2021-06-21 13:13</td>\n",
       "      <td>NaN</td>\n",
       "      <td>229.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>54</td>\n",
       "      <td>机器人辅助椎体后凸成形术治疗单/双节段骨质疏松性椎体压缩骨折临床疗效  网络首发</td>\n",
       "      <td>袁伟;孟小童;刘欣春;朱海涛;丛琳</td>\n",
       "      <td>中国修复重建外科杂志</td>\n",
       "      <td>2021-06-21 10:47</td>\n",
       "      <td>NaN</td>\n",
       "      <td>44.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>55</td>\n",
       "      <td>人工智能价值网络下零售企业商业模式创新与企业效益相关性分析</td>\n",
       "      <td>郭漫勤; 师佳英</td>\n",
       "      <td>商业经济研究</td>\n",
       "      <td>2021-06-21</td>\n",
       "      <td>NaN</td>\n",
       "      <td>240.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>795</th>\n",
       "      <td>846</td>\n",
       "      <td>数字经济研究·主持人语</td>\n",
       "      <td>谢康</td>\n",
       "      <td>北京交通大学学报(社会科学版)</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>49.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>796</th>\n",
       "      <td>847</td>\n",
       "      <td>“一带一路”数字经济的发展图景与法治路径</td>\n",
       "      <td>赵骏</td>\n",
       "      <td>中国法律评论</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>473.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>797</th>\n",
       "      <td>848</td>\n",
       "      <td>智能产业生态系统的结构性特征及发展路径</td>\n",
       "      <td>杜爽</td>\n",
       "      <td>经济纵横</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>144.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>798</th>\n",
       "      <td>849</td>\n",
       "      <td>一纸风行到一端在手——《华西都市报》的转型探析</td>\n",
       "      <td>刘洁</td>\n",
       "      <td>出版广角</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>58.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>799</th>\n",
       "      <td>850</td>\n",
       "      <td>“物联网+人工智能”：Web3.0时代的数字传媒发展初探</td>\n",
       "      <td>冉凌宇</td>\n",
       "      <td>出版广角</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>241.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>800 rows × 10 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     Unnamed: 0                                        篇名                  作者  \\\n",
       "0            51                      基于5G与AI的生态环境监测网络平台探讨            徐爱兰; 耿建生   \n",
       "1            52                        一种小地质体智能综合方法  网络首发  何文娜;朱长青;徐可;陈圆圆;李仰春   \n",
       "2            53              能源转型背景下电力系统不确定性及应对方法综述  网络首发   徐潇源;王晗;严正;鲁卓欣;康重庆   \n",
       "3            54  机器人辅助椎体后凸成形术治疗单/双节段骨质疏松性椎体压缩骨折临床疗效  网络首发   袁伟;孟小童;刘欣春;朱海涛;丛琳   \n",
       "4            55             人工智能价值网络下零售企业商业模式创新与企业效益相关性分析            郭漫勤; 师佳英   \n",
       "..          ...                                       ...                 ...   \n",
       "795         846                               数字经济研究·主持人语                  谢康   \n",
       "796         847                      “一带一路”数字经济的发展图景与法治路径                  赵骏   \n",
       "797         848                       智能产业生态系统的结构性特征及发展路径                  杜爽   \n",
       "798         849                   一纸风行到一端在手——《华西都市报》的转型探析                  刘洁   \n",
       "799         850              “物联网+人工智能”：Web3.0时代的数字传媒发展初探                 冉凌宇   \n",
       "\n",
       "                  刊名              发表时间  被引     下载  操作  \\\n",
       "0          环境监测管理与技术        2021-06-22 NaN  186.0  下载   \n",
       "1            地球物理学进展  2021-06-21 15:33 NaN   87.0  下载   \n",
       "2            电力系统自动化  2021-06-21 13:13 NaN  229.0  下载   \n",
       "3         中国修复重建外科杂志  2021-06-21 10:47 NaN   44.0  下载   \n",
       "4             商业经济研究        2021-06-21 NaN  240.0  下载   \n",
       "..               ...               ...  ..    ...  ..   \n",
       "795  北京交通大学学报(社会科学版)        2021-04-15 NaN   49.0  下载   \n",
       "796           中国法律评论        2021-04-15 NaN  473.0  下载   \n",
       "797             经济纵横        2021-04-15 NaN  144.0  下载   \n",
       "798             出版广角        2021-04-15 NaN   58.0  下载   \n",
       "799             出版广角        2021-04-15 NaN  241.0  下载   \n",
       "\n",
       "                                                 详细页链接  \\\n",
       "0    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "1    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "2    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "3    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "4    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "..                                                 ...   \n",
       "795  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "796  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "797  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "798  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "799  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "\n",
       "                                               PDF下载链接  \n",
       "0    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "1    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "2    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "3    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "4    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "..                                                 ...  \n",
       "795  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "796  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "797  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "798  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "799  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "\n",
       "[800 rows x 10 columns]"
      ]
     },
     "execution_count": 42,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_合并=pd.concat([df_url_out,df_总],axis=1)\n",
    "df_合并"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 43,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>index</th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "      <th>详细页链接</th>\n",
       "      <th>PDF下载链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>机器学习在档案管理中的应用与挑战——基于新南威尔士州档案馆机器学习实验的调查与启示  网络首发</td>\n",
       "      <td>代林序; 张玉洁</td>\n",
       "      <td>档案与建设</td>\n",
       "      <td>2021-07-02 16:16</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>关于智能化战争的基本认知  网络首发</td>\n",
       "      <td>郭明</td>\n",
       "      <td>人民论坛·学术前沿</td>\n",
       "      <td>2021-07-02 15:49</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2</td>\n",
       "      <td>3</td>\n",
       "      <td>金融科技中人工智能技术典型事实与核心规律  网络首发</td>\n",
       "      <td>陈增敬; 严晓东; 冯新伟</td>\n",
       "      <td>中国科学基金</td>\n",
       "      <td>2021-07-02 11:39</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "      <td>卫星在轨故障案例与人工智能故障诊断  网络首发</td>\n",
       "      <td>王亚坤;杨凯飞;张婕;郭莉芳;韩笑冬</td>\n",
       "      <td>中国空间科学技术</td>\n",
       "      <td>2021-07-02 08:49</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>4</td>\n",
       "      <td>5</td>\n",
       "      <td>高等职业教育智能生态系统:内涵、结构与实践路径</td>\n",
       "      <td>徐晔</td>\n",
       "      <td>中国远程教育</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>845</th>\n",
       "      <td>795</td>\n",
       "      <td>846</td>\n",
       "      <td>数字经济研究·主持人语</td>\n",
       "      <td>谢康</td>\n",
       "      <td>北京交通大学学报(社会科学版)</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>49.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>846</th>\n",
       "      <td>796</td>\n",
       "      <td>847</td>\n",
       "      <td>“一带一路”数字经济的发展图景与法治路径</td>\n",
       "      <td>赵骏</td>\n",
       "      <td>中国法律评论</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>473.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>847</th>\n",
       "      <td>797</td>\n",
       "      <td>848</td>\n",
       "      <td>智能产业生态系统的结构性特征及发展路径</td>\n",
       "      <td>杜爽</td>\n",
       "      <td>经济纵横</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>144.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>848</th>\n",
       "      <td>798</td>\n",
       "      <td>849</td>\n",
       "      <td>一纸风行到一端在手——《华西都市报》的转型探析</td>\n",
       "      <td>刘洁</td>\n",
       "      <td>出版广角</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>58.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>849</th>\n",
       "      <td>799</td>\n",
       "      <td>850</td>\n",
       "      <td>“物联网+人工智能”：Web3.0时代的数字传媒发展初探</td>\n",
       "      <td>冉凌宇</td>\n",
       "      <td>出版广角</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>241.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>850 rows × 11 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     index  Unnamed: 0                                               篇名  \\\n",
       "0        0           1  机器学习在档案管理中的应用与挑战——基于新南威尔士州档案馆机器学习实验的调查与启示  网络首发   \n",
       "1        1           2                               关于智能化战争的基本认知  网络首发   \n",
       "2        2           3                       金融科技中人工智能技术典型事实与核心规律  网络首发   \n",
       "3        3           4                          卫星在轨故障案例与人工智能故障诊断  网络首发   \n",
       "4        4           5                          高等职业教育智能生态系统:内涵、结构与实践路径   \n",
       "..     ...         ...                                              ...   \n",
       "845    795         846                                      数字经济研究·主持人语   \n",
       "846    796         847                             “一带一路”数字经济的发展图景与法治路径   \n",
       "847    797         848                              智能产业生态系统的结构性特征及发展路径   \n",
       "848    798         849                          一纸风行到一端在手——《华西都市报》的转型探析   \n",
       "849    799         850                     “物联网+人工智能”：Web3.0时代的数字传媒发展初探   \n",
       "\n",
       "                     作者               刊名              发表时间  被引     下载  操作  \\\n",
       "0              代林序; 张玉洁            档案与建设  2021-07-02 16:16 NaN    NaN  下载   \n",
       "1                    郭明        人民论坛·学术前沿  2021-07-02 15:49 NaN    NaN  下载   \n",
       "2         陈增敬; 严晓东; 冯新伟           中国科学基金  2021-07-02 11:39 NaN    NaN  下载   \n",
       "3    王亚坤;杨凯飞;张婕;郭莉芳;韩笑冬         中国空间科学技术  2021-07-02 08:49 NaN    NaN  下载   \n",
       "4                    徐晔           中国远程教育        2021-07-02 NaN    NaN  下载   \n",
       "..                  ...              ...               ...  ..    ...  ..   \n",
       "845                  谢康  北京交通大学学报(社会科学版)        2021-04-15 NaN   49.0  下载   \n",
       "846                  赵骏           中国法律评论        2021-04-15 NaN  473.0  下载   \n",
       "847                  杜爽             经济纵横        2021-04-15 NaN  144.0  下载   \n",
       "848                  刘洁             出版广角        2021-04-15 NaN   58.0  下载   \n",
       "849                 冉凌宇             出版广角        2021-04-15 NaN  241.0  下载   \n",
       "\n",
       "                                                 详细页链接  \\\n",
       "0    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "1    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "2    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "3    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "4    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "..                                                 ...   \n",
       "845  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "846  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "847  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "848  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "849  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "\n",
       "                                               PDF下载链接  \n",
       "0    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "1    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "2    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "3    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "4    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "..                                                 ...  \n",
       "845  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "846  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "847  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "848  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "849  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "\n",
       "[850 rows x 11 columns]"
      ]
     },
     "execution_count": 43,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "df_总表 = df_首页.append(df_合并).reset_index()\n",
    "df_总表"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 44,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/html": [
       "<div>\n",
       "<style scoped>\n",
       "    .dataframe tbody tr th:only-of-type {\n",
       "        vertical-align: middle;\n",
       "    }\n",
       "\n",
       "    .dataframe tbody tr th {\n",
       "        vertical-align: top;\n",
       "    }\n",
       "\n",
       "    .dataframe thead th {\n",
       "        text-align: right;\n",
       "    }\n",
       "</style>\n",
       "<table border=\"1\" class=\"dataframe\">\n",
       "  <thead>\n",
       "    <tr style=\"text-align: right;\">\n",
       "      <th></th>\n",
       "      <th>index</th>\n",
       "      <th>Unnamed: 0</th>\n",
       "      <th>篇名</th>\n",
       "      <th>作者</th>\n",
       "      <th>刊名</th>\n",
       "      <th>发表时间</th>\n",
       "      <th>被引</th>\n",
       "      <th>下载</th>\n",
       "      <th>操作</th>\n",
       "      <th>详细页链接</th>\n",
       "      <th>PDF下载链接</th>\n",
       "    </tr>\n",
       "  </thead>\n",
       "  <tbody>\n",
       "    <tr>\n",
       "      <th>0</th>\n",
       "      <td>0</td>\n",
       "      <td>1</td>\n",
       "      <td>机器学习在档案管理中的应用与挑战——基于新南威尔士州档案馆机器学习实验的调查与启示  网络首发</td>\n",
       "      <td>代林序; 张玉洁</td>\n",
       "      <td>档案与建设</td>\n",
       "      <td>2021-07-02 16:16</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>1</th>\n",
       "      <td>1</td>\n",
       "      <td>2</td>\n",
       "      <td>关于智能化战争的基本认知  网络首发</td>\n",
       "      <td>郭明</td>\n",
       "      <td>人民论坛·学术前沿</td>\n",
       "      <td>2021-07-02 15:49</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>2</th>\n",
       "      <td>2</td>\n",
       "      <td>3</td>\n",
       "      <td>金融科技中人工智能技术典型事实与核心规律  网络首发</td>\n",
       "      <td>陈增敬; 严晓东; 冯新伟</td>\n",
       "      <td>中国科学基金</td>\n",
       "      <td>2021-07-02 11:39</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>3</th>\n",
       "      <td>3</td>\n",
       "      <td>4</td>\n",
       "      <td>卫星在轨故障案例与人工智能故障诊断  网络首发</td>\n",
       "      <td>王亚坤;杨凯飞;张婕;郭莉芳;韩笑冬</td>\n",
       "      <td>中国空间科学技术</td>\n",
       "      <td>2021-07-02 08:49</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>4</th>\n",
       "      <td>4</td>\n",
       "      <td>5</td>\n",
       "      <td>高等职业教育智能生态系统:内涵、结构与实践路径</td>\n",
       "      <td>徐晔</td>\n",
       "      <td>中国远程教育</td>\n",
       "      <td>2021-07-02</td>\n",
       "      <td>NaN</td>\n",
       "      <td>NaN</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>...</th>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "      <td>...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>845</th>\n",
       "      <td>795</td>\n",
       "      <td>846</td>\n",
       "      <td>数字经济研究·主持人语</td>\n",
       "      <td>谢康</td>\n",
       "      <td>北京交通大学学报(社会科学版)</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>49.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>846</th>\n",
       "      <td>796</td>\n",
       "      <td>847</td>\n",
       "      <td>“一带一路”数字经济的发展图景与法治路径</td>\n",
       "      <td>赵骏</td>\n",
       "      <td>中国法律评论</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>473.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>847</th>\n",
       "      <td>797</td>\n",
       "      <td>848</td>\n",
       "      <td>智能产业生态系统的结构性特征及发展路径</td>\n",
       "      <td>杜爽</td>\n",
       "      <td>经济纵横</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>144.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>848</th>\n",
       "      <td>798</td>\n",
       "      <td>849</td>\n",
       "      <td>一纸风行到一端在手——《华西都市报》的转型探析</td>\n",
       "      <td>刘洁</td>\n",
       "      <td>出版广角</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>58.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "    <tr>\n",
       "      <th>849</th>\n",
       "      <td>799</td>\n",
       "      <td>850</td>\n",
       "      <td>“物联网+人工智能”：Web3.0时代的数字传媒发展初探</td>\n",
       "      <td>冉凌宇</td>\n",
       "      <td>出版广角</td>\n",
       "      <td>2021-04-15</td>\n",
       "      <td>NaN</td>\n",
       "      <td>241.0</td>\n",
       "      <td>下载</td>\n",
       "      <td>https://kns.cnki.net/kcms/detail/detail.aspx?d...</td>\n",
       "      <td>https://kns.cnki.net/kcms/download.aspx?filena...</td>\n",
       "    </tr>\n",
       "  </tbody>\n",
       "</table>\n",
       "<p>850 rows × 11 columns</p>\n",
       "</div>"
      ],
      "text/plain": [
       "     index  Unnamed: 0                                               篇名  \\\n",
       "0        0           1  机器学习在档案管理中的应用与挑战——基于新南威尔士州档案馆机器学习实验的调查与启示  网络首发   \n",
       "1        1           2                               关于智能化战争的基本认知  网络首发   \n",
       "2        2           3                       金融科技中人工智能技术典型事实与核心规律  网络首发   \n",
       "3        3           4                          卫星在轨故障案例与人工智能故障诊断  网络首发   \n",
       "4        4           5                          高等职业教育智能生态系统:内涵、结构与实践路径   \n",
       "..     ...         ...                                              ...   \n",
       "845    795         846                                      数字经济研究·主持人语   \n",
       "846    796         847                             “一带一路”数字经济的发展图景与法治路径   \n",
       "847    797         848                              智能产业生态系统的结构性特征及发展路径   \n",
       "848    798         849                          一纸风行到一端在手——《华西都市报》的转型探析   \n",
       "849    799         850                     “物联网+人工智能”：Web3.0时代的数字传媒发展初探   \n",
       "\n",
       "                     作者               刊名              发表时间  被引     下载  操作  \\\n",
       "0              代林序; 张玉洁            档案与建设  2021-07-02 16:16 NaN    NaN  下载   \n",
       "1                    郭明        人民论坛·学术前沿  2021-07-02 15:49 NaN    NaN  下载   \n",
       "2         陈增敬; 严晓东; 冯新伟           中国科学基金  2021-07-02 11:39 NaN    NaN  下载   \n",
       "3    王亚坤;杨凯飞;张婕;郭莉芳;韩笑冬         中国空间科学技术  2021-07-02 08:49 NaN    NaN  下载   \n",
       "4                    徐晔           中国远程教育        2021-07-02 NaN    NaN  下载   \n",
       "..                  ...              ...               ...  ..    ...  ..   \n",
       "845                  谢康  北京交通大学学报(社会科学版)        2021-04-15 NaN   49.0  下载   \n",
       "846                  赵骏           中国法律评论        2021-04-15 NaN  473.0  下载   \n",
       "847                  杜爽             经济纵横        2021-04-15 NaN  144.0  下载   \n",
       "848                  刘洁             出版广角        2021-04-15 NaN   58.0  下载   \n",
       "849                 冉凌宇             出版广角        2021-04-15 NaN  241.0  下载   \n",
       "\n",
       "                                                 详细页链接  \\\n",
       "0    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "1    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "2    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "3    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "4    https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "..                                                 ...   \n",
       "845  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "846  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "847  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "848  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "849  https://kns.cnki.net/kcms/detail/detail.aspx?d...   \n",
       "\n",
       "                                               PDF下载链接  \n",
       "0    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "1    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "2    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "3    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "4    https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "..                                                 ...  \n",
       "845  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "846  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "847  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "848  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "849  https://kns.cnki.net/kcms/download.aspx?filena...  \n",
       "\n",
       "[850 rows x 11 columns]"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "# 将内容表格存在本地\n",
    "with pd.ExcelWriter('知网.xlsx',mode='w',engine=\"openpyxl\") as writer:  \n",
    "            df_总表.to_excel(writer,sheet_name=\"知网\")\n",
    "display(df_总表)"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 爬取refworks"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 45,
   "metadata": {},
   "outputs": [],
   "source": [
    "#回到第一页\n",
    "element = driver.find_element_by_xpath('//*[@id=\"total\"]')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 46,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "1"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "2"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "3"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "4"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "5"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "6"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "7"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "8"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "9"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "#每页50篇文章，下载大于800篇至少需要翻17页，但知网规定一次最多选取500篇，所以这里设置（0，10）\n",
    "for i in range(0,10):\n",
    "    driver.find_element_by_xpath('//*[@id=\"selectCheckAll1\"]').click()\n",
    "    driver.find_element_by_id('PageNext').click()\n",
    "    time.sleep(5)\n",
    "    display(i)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 47,
   "metadata": {},
   "outputs": [],
   "source": [
    "#定位到要悬停的元素\n",
    "from selenium.webdriver.common.action_chains import ActionChains\n",
    "move = driver.find_element_by_xpath('//*[@id=\"batchOpsBox\"]/li[2]/a')\n",
    "#对定位到的元素执行悬停操作\n",
    "ActionChains(driver).move_to_element(move).perform()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 48,
   "metadata": {},
   "outputs": [],
   "source": [
    "move = driver.find_element_by_xpath('//*[@id=\"batchOpsBox\"]/li[2]/ul/li[1]/a')\n",
    "ActionChains(driver).move_to_element(move).perform()\n",
    "driver.find_element_by_xpath('//*[@id=\"batchOpsBox\"]/li[2]/ul/li[1]/ul/li[8]/a').click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 49,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "['CDwindow-C75A27B0B67D805DDC892DB2ECD948F6',\n",
       " 'CDwindow-C1CAFA10717FF53C58BFD87722DEC54D',\n",
       " 'CDwindow-D404B64CC5FA76F582CA7173A04187A7']"
      ]
     },
     "execution_count": 49,
     "metadata": {},
     "output_type": "execute_result"
    }
   ],
   "source": [
    "## 查看所有的窗口信息\n",
    "driver.window_handles"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 50,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-50-889a0c377e4b>:2: DeprecationWarning: use driver.switch_to.window instead\n",
      "  driver.switch_to_window(driver.window_handles[2])\n"
     ]
    }
   ],
   "source": [
    "# 切换窗口\n",
    "driver.switch_to_window(driver.window_handles[2])"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 51,
   "metadata": {},
   "outputs": [],
   "source": [
    "# 导出 refworks\n",
    "element=driver.find_element_by_xpath('//*[@id=\"litotxt\"]/a')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 后300篇"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 52,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-52-7f2dbf209d83>:2: DeprecationWarning: use driver.switch_to.window instead\n",
      "  driver.switch_to_window(driver.window_handles[1])\n"
     ]
    }
   ],
   "source": [
    "#先回到检索窗口\n",
    "driver.switch_to_window(driver.window_handles[1])\n",
    "#消除原先选定\n",
    "element=driver.find_element_by_xpath('//*[@id=\"gridTable\"]/div[1]/div[2]/div[1]/a')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 53,
   "metadata": {},
   "outputs": [
    {
     "data": {
      "text/plain": [
       "0"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "1"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "2"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "3"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "4"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    },
    {
     "data": {
      "text/plain": [
       "5"
      ]
     },
     "metadata": {},
     "output_type": "display_data"
    }
   ],
   "source": [
    "for i in range(0,6):\n",
    "    driver.find_element_by_xpath('//*[@id=\"selectCheckAll1\"]').click()\n",
    "    driver.find_element_by_id('PageNext').click()\n",
    "    time.sleep(5)\n",
    "    display(i)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 54,
   "metadata": {},
   "outputs": [],
   "source": [
    "#定位到要悬停的元素\n",
    "from selenium.webdriver.common.action_chains import ActionChains\n",
    "move = driver.find_element_by_xpath('//*[@id=\"batchOpsBox\"]/li[2]/a')\n",
    "#对定位到的元素执行悬停操作\n",
    "ActionChains(driver).move_to_element(move).perform()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 55,
   "metadata": {},
   "outputs": [],
   "source": [
    "move = driver.find_element_by_xpath('//*[@id=\"batchOpsBox\"]/li[2]/ul/li[1]/a')\n",
    "ActionChains(driver).move_to_element(move).perform()\n",
    "driver.find_element_by_xpath('//*[@id=\"batchOpsBox\"]/li[2]/ul/li[1]/ul/li[8]/a').click()"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 56,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-56-0dfe2a1ada8f>:1: DeprecationWarning: use driver.switch_to.window instead\n",
      "  driver.switch_to_window(driver.window_handles[2])\n"
     ]
    }
   ],
   "source": [
    "driver.switch_to_window(driver.window_handles[2])\n"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 57,
   "metadata": {},
   "outputs": [],
   "source": [
    "#导出 refworks\n",
    "element=driver.find_element_by_xpath('//*[@id=\"litotxt\"]/a')\n",
    "element.click()"
   ]
  },
  {
   "cell_type": "markdown",
   "metadata": {},
   "source": [
    "### 下载PDF文件"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 61,
   "metadata": {},
   "outputs": [
    {
     "name": "stderr",
     "output_type": "stream",
     "text": [
      "<ipython-input-61-6a5d60430548>:20: DeprecationWarning: use options instead of chrome_options\n",
      "  driver = webdriver.Chrome(executable_path=r'C:\\Users\\奈奈\\AppData\\Local\\Google\\Chrome\\Application\\chromedriver.exe', chrome_options=options)\n"
     ]
    }
   ],
   "source": [
    "# Preparation: start a new Chrome session whose downloads are saved to out_path.\n",
    "options = webdriver.ChromeOptions()\n",
    "out_path = r'D:\\大二\\下\\web-mining\\web-cnki\\PDF文档'  # download directory; change to the path you want\n",
    "prefs = {'profile.default_content_settings.popups': 0, 'download.default_directory': out_path}\n",
    "options.add_experimental_option('prefs', prefs)\n",
    "# Pass the options through `options=`; the `chrome_options=` keyword is deprecated.\n",
    "driver = webdriver.Chrome(executable_path=r'C:\\Users\\奈奈\\AppData\\Local\\Google\\Chrome\\Application\\chromedriver.exe', options=options)"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 62,
   "metadata": {},
   "outputs": [],
   "source": [
    "def base64_api(uname, pwd, img, typeid):\n",
    "    \"\"\"Send an image to the api.ttshitu.com ``predict`` endpoint and return its reply.\n",
    "\n",
    "    Args:\n",
    "        uname: Account name, sent as ``username``.\n",
    "        pwd: Account password, sent as ``password``.\n",
    "        img: Path of the image file; its bytes are sent base64-encoded.\n",
    "        typeid: Forwarded unchanged as ``typeid`` (presumably the captcha type;\n",
    "            confirm against the service documentation).\n",
    "\n",
    "    Returns:\n",
    "        ``result[\"data\"][\"result\"]`` when the reply's ``success`` field is truthy,\n",
    "        otherwise the reply's ``message`` field.\n",
    "    \"\"\"\n",
    "    with open(img, 'rb') as f:\n",
    "        b64 = base64.b64encode(f.read()).decode()\n",
    "    data = {\"username\": uname, \"password\": pwd, \"typeid\": typeid, \"image\": b64}\n",
    "    # A timeout keeps an unresponsive service from blocking the notebook forever.\n",
    "    response = requests.post(\"http://api.ttshitu.com/predict\", json=data, timeout=60)\n",
    "    result = json.loads(response.text)\n",
    "    if result['success']:\n",
    "        return result[\"data\"][\"result\"]\n",
    "    return result[\"message\"]\n",
    "\n",
    "\n",
    "# The function was previously defined under this misspelled name; keep it usable.\n",
    "base64__api = base64_api"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": 63,
   "metadata": {},
   "outputs": [
    {
     "name": "stdout",
     "output_type": "stream",
     "text": [
      "中国遥感软件研制进展与发展方向——以像素专家PIE为例----已下载\n",
      "中国遥感软件研制进展与发展方向——以像素专家PIE为例----已下载\n",
      "移动机器人未知环境下无线基站搜索----已下载\n",
      "工业智能化对制造业高质量发展的影响研究----已下载\n",
      "企业文档智能化管理跃迁的依据与方向初探----已下载\n",
      "新冠肺炎疫情下沙特经济社会转型的挑战及其应对----已下载\n",
      "人工智能时代农村集体经济财务管理模式创新研究----已下载\n",
      "工业智能化能促进企业技术创新吗?——基于中国2010—2019年上市公司数据的分析----已下载\n",
      "人工智能政策对我国金融产业效率的影响——基于金融产业资源配置效率视角----已下载\n",
      "基于智慧时代的农业4.0模式及发展策略研究----已下载\n",
      "后疫情时代中国广告产业发展的基本逻辑与进路----已下载\n",
      "人工智能时代无产阶级的历史使命——对赫拉利“无用阶级”理论的批判----已下载\n",
      "中国数字经济现状及未来发展----已下载\n",
      "大数据技术视域下智慧图书馆伦理危机与控制研究----已下载\n",
      "智媒时代县级融媒建设发展的制约瓶颈与应对策略----已下载\n",
      "我国公众智能价值观的现状评估与引领研究——基于2020年智能技术的热点舆情分析----已下载\n",
      "中国智能媒体的使用现状及其反思----已下载\n",
      "人机融合智能：一种新型智能网络和可能的信息交互媒介----已下载\n",
      "学科交叉下的图书馆学----已下载\n",
      "搜索引擎智能推荐的权力控制与人的能动性----已下载\n",
      "新一代人工智能计算模型的创新及其哲学意义----已下载\n",
      "文艺批评：人工智能及其挑战----已下载\n",
      "国家治理的智能化转向及其实施进路----已下载\n",
      "环境分权体制下人工智能对环境污染治理的影响----已下载\n",
      "司法人工智能融入司法改革的难题与路径----已下载\n",
      "人工智能的道德性何以实现?——基于原则导向治理的法治进路----已下载\n",
      "人工智能在乳腺癌组织病理诊断领域的研究进展----已下载\n",
      "大数据时代的裁判思维----已下载\n",
      "机器人自动压铆控制系统设计----已下载\n"
     ]
    }
   ],
   "source": [
    "import os\n",
    "\n",
    "# Read the xlsx file saved locally earlier; its PDF download links are used below.\n",
    "data = pd.read_excel(\"知网.xlsx\")\n",
    "# Rows to process: positions count (inclusive) to end_count (exclusive).\n",
    "count = 421\n",
    "end_count = 450\n",
    "# Titles and PDF download links for the selected rows.\n",
    "title_list = data[\"篇名\"].to_list()[count:end_count]\n",
    "download_url_list = data[\"PDF下载链接\"].to_list()[count:end_count]\n",
    "\n",
    "# Captcha-service credentials are read from the environment so that they are not\n",
    "# stored in the notebook; set TTSHITU_USERNAME and TTSHITU_PASSWORD before running.\n",
    "captcha_user = os.environ[\"TTSHITU_USERNAME\"]\n",
    "captcha_pwd = os.environ[\"TTSHITU_PASSWORD\"]\n",
    "# File the captcha screenshot is written to before it is sent for recognition.\n",
    "img_path = r\"D:\\大二\\下\\web-mining\\web-cnki\\验证码.png\"\n",
    "\n",
    "for title, download_url in zip(title_list, download_url_list):\n",
    "    try:\n",
    "        # Open the PDF download link.\n",
    "        driver.get(download_url)\n",
    "        time.sleep(5)\n",
    "        # find_elements_* returns an empty list instead of raising when nothing matches,\n",
    "        # so a missing captcha is told apart from a real error.\n",
    "        if not driver.find_elements_by_xpath('//*[@id=\"vImg\"]'):\n",
    "            print(f'{title}----已下载')\n",
    "            continue\n",
    "        # A captcha image is present: screenshot it and have it recognised.\n",
    "        time.sleep(5)\n",
    "        driver.find_element_by_id('vImg').screenshot(img_path)\n",
    "        result = base64_api(uname=captcha_user, pwd=captcha_pwd, img=img_path, typeid=3)\n",
    "        # Show the recognised captcha text.\n",
    "        print(\"验证码识别：\", result)\n",
    "        # Type the captcha into the input field.\n",
    "        driver.find_element_by_id('vcode').send_keys(result)\n",
    "        time.sleep(5)\n",
    "        # Submit the captcha form.\n",
    "        driver.find_element_by_xpath('/html/body/div/form/dl/dd/button').click()\n",
    "    except Exception as exc:\n",
    "        # Report the failure and move on instead of labelling it as downloaded.\n",
    "        print(f'{title}----下载失败: {exc!r}')"
   ]
  },
  {
   "cell_type": "code",
   "execution_count": null,
   "metadata": {},
   "outputs": [],
   "source": []
  }
 ],
 "metadata": {
  "kernelspec": {
   "display_name": "Python 3",
   "language": "python",
   "name": "python3"
  },
  "language_info": {
   "codemirror_mode": {
    "name": "ipython",
    "version": 3
   },
   "file_extension": ".py",
   "mimetype": "text/x-python",
   "name": "python",
   "nbconvert_exporter": "python",
   "pygments_lexer": "ipython3",
   "version": "3.8.3"
  }
 },
 "nbformat": 4,
 "nbformat_minor": 4
}
